diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/README.md b/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..4c192fb495da2b7b34030deda13f226c99060650
--- /dev/null
+++ b/README.md
@@ -0,0 +1,57 @@
+---
+language:
+- en
+- zh
+library_name: transformers
+license: mit
+pipeline_tag: text-generation
+---
+
+# GLM-4.6-FP8
+
+
+

+
+
+ 👋 Join our Discord community.
+
+ 📖 Check out the GLM-4.6 technical blog, technical report (GLM-4.5), and Zhipu AI technical documentation.
+
+ 📍 Use GLM-4.6 API services on the Z.ai API Platform.
+
+ 👉 One click to GLM-4.6.
+
+
+## Model Introduction
+
+Compared with GLM-4.5, **GLM-4.6** brings several key improvements:
+
+* **Longer context window:** The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex agentic tasks.
+* **Superior coding performance:** The model achieves higher scores on code benchmarks and demonstrates better real-world performance in applications such as Claude Code, Cline, Roo Code and Kilo Code, including improvements in generating visually polished front-end pages.
+* **Advanced reasoning:** GLM-4.6 shows a clear improvement in reasoning performance and supports tool use during inference, leading to stronger overall capability.
+* **More capable agents:** GLM-4.6 exhibits stronger performance in tool use and search-based agents, and integrates more effectively within agent frameworks.
+* **Refined writing:** Better aligns with human preferences in style and readability, and performs more naturally in role-playing scenarios.
+
+We evaluated GLM-4.6 across eight public benchmarks covering agents, reasoning, and coding. Results show clear gains over GLM-4.5, with GLM-4.6 also holding competitive advantages over leading domestic and international models such as **DeepSeek-V3.1-Terminus** and **Claude Sonnet 4**.
+
+
+
+## Inference
+
+**Both GLM-4.5 and GLM-4.6 use the same inference method.**
+
+You can check our [GitHub repository](https://github.com/zai-org/GLM-4.5) for more details.
+
+## Recommended Evaluation Parameters
+
+For general evaluations, we recommend using a **sampling temperature of 1.0**.
+
+For **code-related evaluation tasks** (such as LCB), it is further recommended to set:
+
+- `top_p = 0.95`
+- `top_k = 40`
+
+## Evaluation
+
+- For tool-integrated reasoning, please refer to [this doc](https://github.com/zai-org/GLM-4.5/blob/main/resources/glm_4.6_tir_guide.md).
+- For search benchmarks, we designed a specific format for search tool calls in thinking mode to support search agents; please refer to [this file](https://github.com/zai-org/GLM-4.5/blob/main/resources/trajectory_search.json) for the detailed template.
diff --git a/chat_template.jinja b/chat_template.jinja
new file mode 100644
index 0000000000000000000000000000000000000000..41478957aca7a04b7321022e7d1f73de5badd995
--- /dev/null
+++ b/chat_template.jinja
@@ -0,0 +1,103 @@
+[gMASK]<sop>
+{%- if tools -%}{#- When tools are supplied, advertise their JSON signatures and the XML tool-call format. -#}
+<|system|>
+# Tools
+
+You may call one or more functions to assist with the user query.
+
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>
+{% for tool in tools %}
+{{ tool | tojson(ensure_ascii=False) }}
+{% endfor %}
+</tools>
+
+For each function call, output the function name and arguments within the following XML format:
+<tool_call>{function-name}
+<arg_key>{arg-key-1}</arg_key>
+<arg_value>{arg-value-1}</arg_value>
+<arg_key>{arg-key-2}</arg_key>
+<arg_value>{arg-value-2}</arg_value>
+...
+</tool_call>{%- endif -%}
+{%- macro visible_text(content) -%}
+{#- Flatten a message's content to plain text: lists yield only their bare strings and -#}
+{#- 'text'-typed mapping items, concatenated; every other value is emitted unchanged. -#}
+{%- if content is not string and content is iterable and content is not mapping -%}
+{%- for part in content -%}
+{%- if part is string -%}
+{{- part }}
+{%- elif part is mapping and part.type == 'text' -%}
+{{- part.text }}
+{%- endif -%}
+{%- endfor -%}
+{%- else -%}
+{{- content }}
+{%- endif -%}
+{%- endmacro -%}
+{%- set ns = namespace(last_user_index=-1) %}{#- Index of the final user turn; stays -1 when there is none. -#}
+{%- for m in messages %}
+ {%- if m.role == 'user' %}
+ {% set ns.last_user_index = loop.index0 -%}
+ {%- endif %}
+{%- endfor %}
+{% for m in messages %}
+{%- if m.role == 'user' -%}<|user|>
+{{ visible_text(m.content) }}
+{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}}
+{%- elif m.role == 'assistant' -%}
+<|assistant|>
+{%- set reasoning_content = '' %}
+{%- set content = visible_text(m.content) %}
+{%- if m.reasoning_content is string %}{#- Prefer explicit reasoning; otherwise split it out of inline think tags in the content. -#}
+ {%- set reasoning_content = m.reasoning_content %}
+{%- else %}
+ {%- if '</think>' in content %}
+ {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
+ {%- set content = content.split('</think>')[-1].lstrip('\n') %}
+ {%- endif %}
+{%- endif %}
+{%- if loop.index0 > ns.last_user_index and reasoning_content -%}{#- Replay reasoning only for turns after the last user message. -#}
+{{ '\n<think>' + reasoning_content.strip() + '</think>'}}
+{%- else -%}
+{{ '\n<think></think>' }}
+{%- endif -%}
+{%- if content.strip() -%}
+{{ '\n' + content.strip() }}
+{%- endif -%}
+{% if m.tool_calls %}
+{% for tc in m.tool_calls %}
+{%- if tc.function %}
+ {%- set tc = tc.function %}
+{%- endif %}
+{{ '\n<tool_call>' + tc.name }}
+{% set _args = tc.arguments %}
+{% for k, v in _args.items() %}
+<arg_key>{{ k }}</arg_key>
+<arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>
+{% endfor %}
+</tool_call>{% endfor %}
+{% endif %}
+{%- elif m.role == 'tool' -%}
+{%- if m.content is string -%}
+{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}{#- Consecutive tool results share a single observation header. -#}
+ {{- '<|observation|>' }}
+{%- endif %}
+{{- '\n<tool_response>\n' }}
+{{- m.content }}
+{{- '\n</tool_response>' }}
+{%- else -%}
+<|observation|>{% for tr in m.content %}
+
+<tool_response>
+{{ tr.output if tr.output is defined else tr }}
+</tool_response>{% endfor -%}
+{% endif -%}
+{%- elif m.role == 'system' -%}
+<|system|>
+{{ visible_text(m.content) }}
+{%- endif -%}
+{%- endfor -%}
+{%- if add_generation_prompt -%}
+ <|assistant|>{{- '\n<think></think>' if (enable_thinking is defined and not enable_thinking) else '' -}}
+{%- endif -%}
\ No newline at end of file
diff --git a/config.json b/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..2583316dbdba4a193a7560a659add3461848eecd
--- /dev/null
+++ b/config.json
@@ -0,0 +1,921 @@
+{
+ "architectures": [
+ "Glm4MoeForCausalLM"
+ ],
+ "attention_bias": true,
+ "attention_dropout": 0.0,
+ "pad_token_id": 151329,
+ "eos_token_id": [
+ 151329,
+ 151336,
+ 151338
+ ],
+ "head_dim": 128,
+ "hidden_act": "silu",
+ "hidden_size": 5120,
+ "partial_rotary_factor": 0.5,
+ "initializer_range": 0.02,
+ "intermediate_size": 12288,
+ "max_position_embeddings": 202752,
+ "model_type": "glm4_moe",
+ "moe_intermediate_size": 1536,
+ "norm_topk_prob": true,
+ "num_attention_heads": 96,
+ "n_group": 1,
+ "topk_group": 1,
+ "n_routed_experts": 160,
+ "n_shared_experts": 1,
+ "routed_scaling_factor": 2.5,
+ "num_experts_per_tok": 8,
+ "first_k_dense_replace": 3,
+ "num_hidden_layers": 92,
+ "num_key_value_heads": 8,
+ "rms_norm_eps": 1e-05,
+ "rope_scaling": null,
+ "rope_theta": 1000000,
+ "num_nextn_predict_layers": 1,
+ "tie_word_embeddings": false,
+ "torch_dtype": "bfloat16",
+ "transformers_version": "4.54.0",
+ "use_cache": true,
+ "use_qk_norm": true,
+ "vocab_size": 151552,
+ "quantization_config": {
+ "config_groups": {
+ "group_0": {
+ "input_activations": {
+ "actorder": null,
+ "block_structure": null,
+ "dynamic": true,
+ "group_size": null,
+ "num_bits": 8,
+ "observer": null,
+ "observer_kwargs": {},
+ "strategy": "token",
+ "symmetric": true,
+ "type": "float"
+ },
+ "output_activations": null,
+ "targets": [
+ "Linear"
+ ],
+ "weights": {
+ "actorder": null,
+ "block_structure": null,
+ "dynamic": false,
+ "group_size": null,
+ "num_bits": 8,
+ "observer": "minmax",
+ "observer_kwargs": {},
+ "strategy": "channel",
+ "symmetric": true,
+ "type": "float"
+ }
+ }
+ },
+ "format": "float-quantized",
+ "ignore": [
+ "model.layers.12.input_layernorm",
+ "model.layers.48.input_layernorm",
+ "model.layers.74.input_layernorm",
+ "model.layers.5.self_attn.q_norm",
+ "model.layers.11.self_attn.k_proj.bias",
+ "model.layers.3.self_attn.k_proj.bias",
+ "model.layers.53.self_attn.q_norm",
+ "model.layers.52.mlp.gate",
+ "model.layers.29.mlp.gate.e_score_correction_bias",
+ "model.layers.34.post_attention_layernorm",
+ "model.layers.88.post_attention_layernorm",
+ "model.layers.17.input_layernorm",
+ "model.layers.37.self_attn.k_norm",
+ "model.layers.9.mlp.gate.e_score_correction_bias",
+ "model.layers.17.self_attn.v_proj.bias",
+ "model.layers.82.self_attn.q_norm",
+ "model.layers.41.mlp.gate",
+ "model.layers.73.input_layernorm",
+ "model.layers.72.input_layernorm",
+ "model.layers.61.post_attention_layernorm",
+ "model.layers.30.input_layernorm",
+ "model.layers.80.mlp.gate",
+ "model.layers.14.input_layernorm",
+ "model.layers.45.self_attn.k_norm",
+ "model.layers.55.mlp.gate",
+ "model.layers.9.input_layernorm",
+ "model.layers.13.input_layernorm",
+ "model.layers.47.self_attn.q_proj.bias",
+ "model.layers.84.post_attention_layernorm",
+ "model.layers.85.self_attn.q_norm",
+ "model.layers.53.self_attn.v_proj.bias",
+ "model.layers.83.self_attn.v_proj.bias",
+ "model.layers.35.self_attn.v_proj.bias",
+ "model.layers.76.mlp.gate.e_score_correction_bias",
+ "model.layers.36.input_layernorm",
+ "model.layers.13.post_attention_layernorm",
+ "model.layers.71.self_attn.k_proj.bias",
+ "model.layers.84.mlp.gate.e_score_correction_bias",
+ "model.layers.46.self_attn.k_norm",
+ "model.layers.50.self_attn.q_norm",
+ "model.layers.59.self_attn.q_proj.bias",
+ "model.layers.5.input_layernorm",
+ "model.layers.29.mlp.gate",
+ "model.layers.73.self_attn.q_norm",
+ "model.layers.27.mlp.gate",
+ "model.layers.49.post_attention_layernorm",
+ "model.layers.63.self_attn.q_proj.bias",
+ "model.layers.7.self_attn.q_proj.bias",
+ "model.layers.5.self_attn.k_proj.bias",
+ "model.layers.70.self_attn.q_proj.bias",
+ "model.layers.70.self_attn.k_norm",
+ "model.layers.15.self_attn.q_proj.bias",
+ "model.layers.59.self_attn.q_norm",
+ "model.layers.89.self_attn.k_proj.bias",
+ "model.layers.89.self_attn.q_norm",
+ "model.layers.42.mlp.gate.e_score_correction_bias",
+ "model.layers.62.self_attn.q_norm",
+ "model.layers.18.input_layernorm",
+ "model.layers.79.post_attention_layernorm",
+ "model.layers.63.self_attn.k_norm",
+ "model.layers.58.input_layernorm",
+ "model.layers.57.mlp.gate",
+ "model.layers.32.self_attn.q_norm",
+ "model.layers.34.self_attn.v_proj.bias",
+ "model.layers.83.self_attn.k_proj.bias",
+ "model.layers.7.input_layernorm",
+ "model.layers.72.self_attn.k_norm",
+ "model.layers.55.self_attn.v_proj.bias",
+ "model.layers.2.self_attn.k_proj.bias",
+ "model.layers.23.post_attention_layernorm",
+ "model.layers.60.post_attention_layernorm",
+ "model.layers.33.self_attn.k_proj.bias",
+ "model.layers.85.self_attn.k_proj.bias",
+ "model.layers.83.mlp.gate.e_score_correction_bias",
+ "model.layers.20.self_attn.k_proj.bias",
+ "model.layers.11.mlp.gate",
+ "model.layers.82.input_layernorm",
+ "model.layers.83.self_attn.q_norm",
+ "model.layers.9.post_attention_layernorm",
+ "model.layers.55.mlp.gate.e_score_correction_bias",
+ "model.layers.21.mlp.gate",
+ "model.layers.41.mlp.gate.e_score_correction_bias",
+ "model.layers.10.mlp.gate.e_score_correction_bias",
+ "model.layers.49.mlp.gate",
+ "model.layers.56.self_attn.k_norm",
+ "model.layers.86.self_attn.q_norm",
+ "model.layers.89.input_layernorm",
+ "model.layers.16.input_layernorm",
+ "model.layers.25.mlp.gate.e_score_correction_bias",
+ "model.layers.8.self_attn.k_norm",
+ "model.layers.72.post_attention_layernorm",
+ "model.layers.92.self_attn.q_norm",
+ "model.layers.73.post_attention_layernorm",
+ "model.layers.71.mlp.gate.e_score_correction_bias",
+ "model.layers.42.input_layernorm",
+ "model.layers.25.self_attn.k_norm",
+ "model.layers.50.self_attn.q_proj.bias",
+ "model.layers.13.self_attn.k_norm",
+ "model.layers.65.mlp.gate.e_score_correction_bias",
+ "model.layers.9.self_attn.k_norm",
+ "model.layers.3.input_layernorm",
+ "model.layers.90.self_attn.q_proj.bias",
+ "model.layers.35.self_attn.q_norm",
+ "model.layers.74.mlp.gate",
+ "model.layers.21.self_attn.k_norm",
+ "model.layers.92.mlp.gate",
+ "model.layers.15.mlp.gate.e_score_correction_bias",
+ "model.layers.61.self_attn.k_proj.bias",
+ "model.layers.63.self_attn.q_norm",
+ "model.layers.73.self_attn.q_proj.bias",
+ "model.layers.18.self_attn.q_norm",
+ "model.layers.45.mlp.gate",
+ "model.layers.52.self_attn.v_proj.bias",
+ "model.layers.22.post_attention_layernorm",
+ "model.layers.85.self_attn.q_proj.bias",
+ "model.layers.3.self_attn.k_norm",
+ "model.layers.54.self_attn.v_proj.bias",
+ "model.layers.79.self_attn.v_proj.bias",
+ "model.layers.31.self_attn.q_proj.bias",
+ "model.layers.2.input_layernorm",
+ "model.layers.57.self_attn.q_norm",
+ "model.layers.65.self_attn.k_norm",
+ "model.layers.60.input_layernorm",
+ "model.layers.70.self_attn.v_proj.bias",
+ "model.layers.87.post_attention_layernorm",
+ "model.layers.83.post_attention_layernorm",
+ "model.layers.51.self_attn.k_proj.bias",
+ "model.layers.23.self_attn.k_norm",
+ "model.layers.49.self_attn.k_norm",
+ "model.layers.76.self_attn.k_proj.bias",
+ "model.layers.7.self_attn.q_norm",
+ "model.layers.54.mlp.gate",
+ "model.layers.63.post_attention_layernorm",
+ "model.layers.27.self_attn.k_proj.bias",
+ "model.layers.81.input_layernorm",
+ "model.layers.66.post_attention_layernorm",
+ "model.layers.84.self_attn.q_proj.bias",
+ "model.layers.36.self_attn.k_proj.bias",
+ "model.layers.30.self_attn.v_proj.bias",
+ "model.layers.48.self_attn.k_norm",
+ "model.layers.62.mlp.gate",
+ "model.layers.8.mlp.gate",
+ "model.layers.11.mlp.gate.e_score_correction_bias",
+ "model.layers.28.mlp.gate",
+ "model.layers.30.mlp.gate.e_score_correction_bias",
+ "model.layers.43.input_layernorm",
+ "model.layers.3.self_attn.q_proj.bias",
+ "model.layers.88.input_layernorm",
+ "model.layers.5.post_attention_layernorm",
+ "model.layers.35.self_attn.k_norm",
+ "model.layers.56.post_attention_layernorm",
+ "model.layers.30.mlp.gate",
+ "model.layers.67.self_attn.q_proj.bias",
+ "model.layers.58.post_attention_layernorm",
+ "model.layers.80.post_attention_layernorm",
+ "model.layers.88.self_attn.v_proj.bias",
+ "model.layers.90.self_attn.v_proj.bias",
+ "model.layers.2.self_attn.k_norm",
+ "model.layers.67.mlp.gate.e_score_correction_bias",
+ "model.layers.31.input_layernorm",
+ "model.layers.26.post_attention_layernorm",
+ "model.layers.81.self_attn.k_proj.bias",
+ "model.layers.51.self_attn.q_norm",
+ "model.layers.7.self_attn.k_proj.bias",
+ "model.layers.76.self_attn.q_proj.bias",
+ "model.layers.1.self_attn.k_norm",
+ "model.layers.34.mlp.gate.e_score_correction_bias",
+ "model.layers.80.self_attn.k_proj.bias",
+ "model.layers.0.self_attn.k_norm",
+ "model.layers.44.self_attn.q_norm",
+ "model.layers.29.input_layernorm",
+ "model.layers.77.self_attn.v_proj.bias",
+ "model.layers.73.mlp.gate",
+ "model.layers.31.self_attn.v_proj.bias",
+ "model.layers.46.self_attn.q_proj.bias",
+ "model.layers.62.self_attn.k_norm",
+ "model.layers.87.self_attn.k_proj.bias",
+ "model.layers.58.self_attn.k_norm",
+ "model.layers.66.mlp.gate.e_score_correction_bias",
+ "model.layers.32.mlp.gate.e_score_correction_bias",
+ "model.layers.73.self_attn.k_proj.bias",
+ "model.layers.85.mlp.gate.e_score_correction_bias",
+ "model.layers.23.mlp.gate",
+ "model.layers.72.self_attn.q_proj.bias",
+ "model.layers.25.mlp.gate",
+ "model.layers.43.mlp.gate.e_score_correction_bias",
+ "model.layers.50.mlp.gate.e_score_correction_bias",
+ "model.layers.6.mlp.gate.e_score_correction_bias",
+ "model.layers.14.mlp.gate",
+ "model.layers.50.self_attn.v_proj.bias",
+ "model.layers.33.self_attn.k_norm",
+ "model.layers.92.self_attn.q_proj.bias",
+ "model.layers.6.self_attn.k_proj.bias",
+ "model.layers.43.mlp.gate",
+ "model.layers.68.self_attn.q_proj.bias",
+ "model.layers.33.self_attn.v_proj.bias",
+ "model.layers.41.self_attn.k_norm",
+ "model.layers.32.self_attn.k_norm",
+ "model.layers.28.post_attention_layernorm",
+ "model.layers.61.self_attn.v_proj.bias",
+ "model.layers.16.post_attention_layernorm",
+ "model.layers.48.mlp.gate.e_score_correction_bias",
+ "model.layers.4.self_attn.v_proj.bias",
+ "model.layers.88.self_attn.k_norm",
+ "model.layers.68.self_attn.k_norm",
+ "model.layers.77.self_attn.q_proj.bias",
+ "model.layers.8.self_attn.v_proj.bias",
+ "model.layers.20.mlp.gate.e_score_correction_bias",
+ "model.layers.86.self_attn.k_norm",
+ "model.layers.36.self_attn.v_proj.bias",
+ "model.layers.71.input_layernorm",
+ "model.layers.72.mlp.gate",
+ "model.layers.24.self_attn.k_norm",
+ "model.layers.20.self_attn.q_norm",
+ "model.layers.62.post_attention_layernorm",
+ "model.layers.3.self_attn.v_proj.bias",
+ "model.layers.25.input_layernorm",
+ "model.layers.20.self_attn.v_proj.bias",
+ "model.layers.64.self_attn.v_proj.bias",
+ "model.layers.19.self_attn.k_proj.bias",
+ "model.layers.63.mlp.gate.e_score_correction_bias",
+ "model.layers.92.embed_tokens",
+ "model.layers.62.self_attn.q_proj.bias",
+ "model.layers.69.self_attn.q_norm",
+ "model.layers.9.mlp.gate",
+ "model.layers.62.mlp.gate.e_score_correction_bias",
+ "model.layers.35.self_attn.k_proj.bias",
+ "model.layers.1.self_attn.q_proj.bias",
+ "model.layers.40.self_attn.q_norm",
+ "model.layers.26.input_layernorm",
+ "model.layers.50.self_attn.k_proj.bias",
+ "model.layers.39.input_layernorm",
+ "model.layers.28.self_attn.k_proj.bias",
+ "model.layers.39.self_attn.q_proj.bias",
+ "model.layers.5.mlp.gate",
+ "model.layers.56.input_layernorm",
+ "model.layers.60.self_attn.k_norm",
+ "model.layers.76.self_attn.q_norm",
+ "lm_head",
+ "model.layers.69.self_attn.k_norm",
+ "model.layers.23.self_attn.q_proj.bias",
+ "model.layers.58.self_attn.q_proj.bias",
+ "model.norm",
+ "model.layers.53.self_attn.k_proj.bias",
+ "model.layers.73.self_attn.v_proj.bias",
+ "model.layers.33.self_attn.q_proj.bias",
+ "model.layers.64.input_layernorm",
+ "model.layers.15.mlp.gate",
+ "model.layers.55.self_attn.q_proj.bias",
+ "model.layers.55.self_attn.k_norm",
+ "model.layers.27.mlp.gate.e_score_correction_bias",
+ "model.layers.68.input_layernorm",
+ "model.layers.30.self_attn.q_norm",
+ "model.layers.82.post_attention_layernorm",
+ "model.layers.29.self_attn.q_proj.bias",
+ "model.layers.79.self_attn.k_proj.bias",
+ "model.layers.16.self_attn.k_proj.bias",
+ "model.layers.71.self_attn.k_norm",
+ "model.layers.16.self_attn.k_norm",
+ "model.layers.75.self_attn.k_proj.bias",
+ "model.layers.52.self_attn.q_norm",
+ "model.layers.87.self_attn.v_proj.bias",
+ "model.layers.23.self_attn.k_proj.bias",
+ "model.layers.24.post_attention_layernorm",
+ "model.layers.40.self_attn.q_proj.bias",
+ "model.layers.46.mlp.gate.e_score_correction_bias",
+ "model.layers.54.input_layernorm",
+ "model.layers.75.post_attention_layernorm",
+ "model.layers.72.self_attn.k_proj.bias",
+ "model.layers.82.self_attn.q_proj.bias",
+ "model.layers.75.mlp.gate.e_score_correction_bias",
+ "model.layers.27.self_attn.q_norm",
+ "model.layers.39.self_attn.q_norm",
+ "model.layers.45.self_attn.k_proj.bias",
+ "model.layers.90.self_attn.k_proj.bias",
+ "model.layers.65.self_attn.q_proj.bias",
+ "model.layers.5.self_attn.k_norm",
+ "model.layers.89.self_attn.q_proj.bias",
+ "model.layers.10.self_attn.k_proj.bias",
+ "model.layers.86.self_attn.v_proj.bias",
+ "model.layers.89.mlp.gate.e_score_correction_bias",
+ "model.layers.42.self_attn.k_norm",
+ "model.layers.57.self_attn.k_proj.bias",
+ "model.layers.68.post_attention_layernorm",
+ "model.layers.1.self_attn.v_proj.bias",
+ "model.layers.38.self_attn.k_proj.bias",
+ "model.layers.75.self_attn.v_proj.bias",
+ "model.layers.44.self_attn.q_proj.bias",
+ "model.layers.8.mlp.gate.e_score_correction_bias",
+ "model.layers.55.input_layernorm",
+ "model.layers.7.self_attn.v_proj.bias",
+ "model.layers.51.self_attn.k_norm",
+ "model.layers.19.mlp.gate",
+ "model.layers.12.self_attn.q_norm",
+ "model.layers.78.self_attn.k_norm",
+ "model.layers.61.self_attn.q_norm",
+ "model.layers.18.mlp.gate",
+ "model.layers.8.self_attn.q_norm",
+ "model.layers.7.self_attn.k_norm",
+ "model.layers.84.self_attn.q_norm",
+ "model.layers.44.self_attn.k_proj.bias",
+ "model.layers.38.self_attn.q_proj.bias",
+ "model.layers.37.mlp.gate.e_score_correction_bias",
+ "model.layers.34.mlp.gate",
+ "model.layers.92.eh_proj",
+ "model.layers.75.self_attn.q_proj.bias",
+ "model.layers.61.mlp.gate.e_score_correction_bias",
+ "model.layers.33.mlp.gate.e_score_correction_bias",
+ "model.layers.81.mlp.gate.e_score_correction_bias",
+ "model.layers.47.self_attn.k_proj.bias",
+ "model.layers.72.self_attn.q_norm",
+ "model.layers.62.self_attn.k_proj.bias",
+ "model.layers.33.self_attn.q_norm",
+ "model.layers.24.mlp.gate",
+ "model.layers.51.input_layernorm",
+ "model.layers.42.self_attn.k_proj.bias",
+ "model.layers.43.self_attn.k_norm",
+ "model.layers.46.self_attn.k_proj.bias",
+ "model.layers.66.input_layernorm",
+ "model.layers.31.mlp.gate.e_score_correction_bias",
+ "model.layers.77.post_attention_layernorm",
+ "model.layers.52.self_attn.k_norm",
+ "model.layers.4.mlp.gate",
+ "model.layers.51.post_attention_layernorm",
+ "model.layers.15.self_attn.k_norm",
+ "model.layers.60.self_attn.k_proj.bias",
+ "model.layers.6.self_attn.q_norm",
+ "model.layers.85.mlp.gate",
+ "model.layers.66.self_attn.k_norm",
+ "model.layers.22.self_attn.v_proj.bias",
+ "model.layers.36.self_attn.k_norm",
+ "model.layers.8.input_layernorm",
+ "model.layers.19.mlp.gate.e_score_correction_bias",
+ "model.layers.25.self_attn.k_proj.bias",
+ "model.layers.31.self_attn.q_norm",
+ "model.layers.16.mlp.gate.e_score_correction_bias",
+ "model.layers.57.self_attn.v_proj.bias",
+ "model.layers.35.mlp.gate",
+ "model.layers.75.input_layernorm",
+ "model.layers.2.self_attn.v_proj.bias",
+ "model.layers.9.self_attn.v_proj.bias",
+ "model.layers.80.self_attn.q_proj.bias",
+ "model.layers.19.self_attn.v_proj.bias",
+ "model.layers.4.post_attention_layernorm",
+ "model.layers.65.input_layernorm",
+ "model.layers.82.mlp.gate.e_score_correction_bias",
+ "model.layers.69.post_attention_layernorm",
+ "model.layers.21.self_attn.q_norm",
+ "model.layers.18.post_attention_layernorm",
+ "model.layers.81.self_attn.q_proj.bias",
+ "model.layers.77.input_layernorm",
+ "model.layers.17.self_attn.q_norm",
+ "model.layers.80.input_layernorm",
+ "model.layers.13.mlp.gate.e_score_correction_bias",
+ "model.layers.0.post_attention_layernorm",
+ "model.layers.19.post_attention_layernorm",
+ "model.layers.91.self_attn.v_proj.bias",
+ "model.layers.77.mlp.gate",
+ "model.layers.11.self_attn.q_norm",
+ "model.layers.92.hnorm",
+ "model.layers.11.self_attn.q_proj.bias",
+ "model.layers.47.self_attn.q_norm",
+ "model.layers.42.self_attn.v_proj.bias",
+ "model.layers.90.input_layernorm",
+ "model.layers.78.input_layernorm",
+ "model.layers.11.self_attn.v_proj.bias",
+ "model.layers.80.self_attn.q_norm",
+ "model.layers.83.input_layernorm",
+ "model.layers.43.self_attn.q_norm",
+ "model.layers.91.post_attention_layernorm",
+ "model.layers.50.mlp.gate",
+ "model.layers.48.self_attn.k_proj.bias",
+ "model.layers.70.mlp.gate.e_score_correction_bias",
+ "model.layers.14.self_attn.q_proj.bias",
+ "model.layers.31.self_attn.k_proj.bias",
+ "model.layers.47.self_attn.v_proj.bias",
+ "model.layers.12.self_attn.k_proj.bias",
+ "model.layers.12.mlp.gate",
+ "model.layers.34.self_attn.q_norm",
+ "model.layers.62.self_attn.v_proj.bias",
+ "model.layers.26.mlp.gate.e_score_correction_bias",
+ "model.layers.45.mlp.gate.e_score_correction_bias",
+ "model.layers.77.self_attn.q_norm",
+ "model.layers.47.self_attn.k_norm",
+ "model.layers.53.post_attention_layernorm",
+ "model.layers.7.post_attention_layernorm",
+ "model.layers.90.post_attention_layernorm",
+ "model.layers.40.mlp.gate.e_score_correction_bias",
+ "model.layers.63.input_layernorm",
+ "model.layers.52.mlp.gate.e_score_correction_bias",
+ "model.layers.92.input_layernorm",
+ "model.layers.44.self_attn.v_proj.bias",
+ "model.layers.46.mlp.gate",
+ "model.layers.18.self_attn.k_proj.bias",
+ "model.layers.62.input_layernorm",
+ "model.layers.24.self_attn.v_proj.bias",
+ "model.layers.40.post_attention_layernorm",
+ "model.layers.8.post_attention_layernorm",
+ "model.layers.82.mlp.gate",
+ "model.layers.17.post_attention_layernorm",
+ "model.layers.45.self_attn.v_proj.bias",
+ "model.layers.84.self_attn.k_proj.bias",
+ "model.layers.15.self_attn.k_proj.bias",
+ "model.layers.0.self_attn.q_proj.bias",
+ "model.layers.92.shared_head.norm",
+ "model.layers.51.self_attn.q_proj.bias",
+ "model.layers.22.mlp.gate",
+ "model.layers.4.self_attn.k_norm",
+ "model.layers.84.input_layernorm",
+ "model.layers.30.self_attn.k_proj.bias",
+ "model.layers.12.self_attn.v_proj.bias",
+ "model.layers.37.input_layernorm",
+ "model.layers.37.self_attn.q_norm",
+ "model.layers.45.self_attn.q_norm",
+ "model.layers.72.self_attn.v_proj.bias",
+ "model.layers.64.self_attn.k_norm",
+ "model.layers.43.self_attn.k_proj.bias",
+ "model.layers.38.mlp.gate.e_score_correction_bias",
+ "model.layers.79.input_layernorm",
+ "model.layers.48.mlp.gate",
+ "model.layers.52.self_attn.q_proj.bias",
+ "model.layers.46.self_attn.v_proj.bias",
+ "model.layers.81.mlp.gate",
+ "model.layers.71.self_attn.q_proj.bias",
+ "model.layers.50.self_attn.k_norm",
+ "model.layers.18.self_attn.v_proj.bias",
+ "model.layers.53.input_layernorm",
+ "model.layers.64.self_attn.q_proj.bias",
+ "model.layers.12.self_attn.k_norm",
+ "model.embed_tokens",
+ "model.layers.78.self_attn.k_proj.bias",
+ "model.layers.40.self_attn.k_norm",
+ "model.layers.11.input_layernorm",
+ "model.layers.22.input_layernorm",
+ "model.layers.39.mlp.gate",
+ "model.layers.30.self_attn.k_norm",
+ "model.layers.71.mlp.gate",
+ "model.layers.71.post_attention_layernorm",
+ "model.layers.78.self_attn.q_norm",
+ "model.layers.87.mlp.gate",
+ "model.layers.14.self_attn.q_norm",
+ "model.layers.42.post_attention_layernorm",
+ "model.layers.3.post_attention_layernorm",
+ "model.layers.92.self_attn.k_proj.bias",
+ "model.layers.3.mlp.gate",
+ "model.layers.89.mlp.gate",
+ "model.layers.86.self_attn.k_proj.bias",
+ "model.layers.87.self_attn.q_proj.bias",
+ "model.layers.63.self_attn.k_proj.bias",
+ "model.layers.87.input_layernorm",
+ "model.layers.10.self_attn.q_proj.bias",
+ "model.layers.81.post_attention_layernorm",
+ "model.layers.39.self_attn.v_proj.bias",
+ "model.layers.43.post_attention_layernorm",
+ "model.layers.76.mlp.gate",
+ "model.layers.28.self_attn.v_proj.bias",
+ "model.layers.57.self_attn.q_proj.bias",
+ "model.layers.21.mlp.gate.e_score_correction_bias",
+ "model.layers.75.self_attn.q_norm",
+ "model.layers.58.self_attn.k_proj.bias",
+ "model.layers.52.input_layernorm",
+ "model.layers.0.self_attn.k_proj.bias",
+ "model.layers.78.mlp.gate.e_score_correction_bias",
+ "model.layers.85.self_attn.k_norm",
+ "model.layers.42.self_attn.q_norm",
+ "model.layers.25.self_attn.v_proj.bias",
+ "model.layers.36.post_attention_layernorm",
+ "model.layers.4.self_attn.q_norm",
+ "model.layers.16.self_attn.q_norm",
+ "model.layers.41.self_attn.k_proj.bias",
+ "model.layers.5.self_attn.q_proj.bias",
+ "model.layers.28.self_attn.q_norm",
+ "model.layers.41.self_attn.q_proj.bias",
+ "model.layers.68.mlp.gate.e_score_correction_bias",
+ "model.layers.26.self_attn.k_proj.bias",
+ "model.layers.86.input_layernorm",
+ "model.layers.35.mlp.gate.e_score_correction_bias",
+ "model.layers.69.input_layernorm",
+ "model.layers.77.mlp.gate.e_score_correction_bias",
+ "model.layers.10.self_attn.q_norm",
+ "model.layers.32.post_attention_layernorm",
+ "model.layers.54.self_attn.q_norm",
+ "model.layers.45.post_attention_layernorm",
+ "model.layers.45.input_layernorm",
+ "model.layers.15.post_attention_layernorm",
+ "model.layers.64.post_attention_layernorm",
+ "model.layers.15.self_attn.v_proj.bias",
+ "model.layers.24.self_attn.k_proj.bias",
+ "model.layers.64.self_attn.k_proj.bias",
+ "model.layers.14.post_attention_layernorm",
+ "model.layers.40.mlp.gate",
+ "model.layers.50.input_layernorm",
+ "model.layers.21.self_attn.v_proj.bias",
+ "model.layers.66.self_attn.q_proj.bias",
+ "model.layers.78.mlp.gate",
+ "model.layers.2.self_attn.q_proj.bias",
+ "model.layers.12.self_attn.q_proj.bias",
+ "model.layers.7.mlp.gate",
+ "model.layers.35.post_attention_layernorm",
+ "model.layers.52.post_attention_layernorm",
+ "model.layers.30.post_attention_layernorm",
+ "model.layers.59.input_layernorm",
+ "model.layers.86.post_attention_layernorm",
+ "model.layers.0.self_attn.v_proj.bias",
+ "model.layers.24.mlp.gate.e_score_correction_bias",
+ "model.layers.34.self_attn.k_norm",
+ "model.layers.4.self_attn.k_proj.bias",
+ "model.layers.74.self_attn.q_proj.bias",
+ "model.layers.78.self_attn.v_proj.bias",
+ "model.layers.49.self_attn.q_proj.bias",
+ "model.layers.53.mlp.gate.e_score_correction_bias",
+ "model.layers.60.self_attn.v_proj.bias",
+ "model.layers.59.mlp.gate",
+ "model.layers.61.mlp.gate",
+ "model.layers.26.self_attn.q_norm",
+ "model.layers.1.input_layernorm",
+ "model.layers.33.mlp.gate",
+ "model.layers.91.mlp.gate",
+ "model.layers.26.self_attn.q_proj.bias",
+ "model.layers.83.mlp.gate",
+ "model.layers.12.mlp.gate.e_score_correction_bias",
+ "model.layers.36.self_attn.q_norm",
+ "model.layers.91.mlp.gate.e_score_correction_bias",
+ "model.layers.25.self_attn.q_norm",
+ "model.layers.91.self_attn.k_norm",
+ "model.layers.20.self_attn.k_norm",
+ "model.layers.8.self_attn.k_proj.bias",
+ "model.layers.29.self_attn.v_proj.bias",
+ "model.layers.82.self_attn.k_proj.bias",
+ "model.layers.89.post_attention_layernorm",
+ "model.layers.29.self_attn.k_norm",
+ "model.layers.88.self_attn.q_norm",
+ "model.layers.48.self_attn.q_proj.bias",
+ "model.layers.22.self_attn.k_norm",
+ "model.layers.27.self_attn.q_proj.bias",
+ "model.layers.23.mlp.gate.e_score_correction_bias",
+ "model.layers.1.post_attention_layernorm",
+ "model.layers.29.post_attention_layernorm",
+ "model.layers.58.mlp.gate",
+ "model.layers.27.input_layernorm",
+ "model.layers.66.self_attn.k_proj.bias",
+ "model.layers.87.mlp.gate.e_score_correction_bias",
+ "model.layers.22.self_attn.q_norm",
+ "model.layers.4.mlp.gate.e_score_correction_bias",
+ "model.layers.51.mlp.gate",
+ "model.layers.90.mlp.gate.e_score_correction_bias",
+ "model.layers.3.self_attn.q_norm",
+ "model.layers.33.input_layernorm",
+ "model.layers.91.self_attn.k_proj.bias",
+ "model.layers.8.self_attn.q_proj.bias",
+ "model.layers.12.post_attention_layernorm",
+ "model.layers.3.mlp.gate.e_score_correction_bias",
+ "model.layers.69.mlp.gate.e_score_correction_bias",
+ "model.layers.17.self_attn.k_proj.bias",
+ "model.layers.82.self_attn.k_norm",
+ "model.layers.10.post_attention_layernorm",
+ "model.layers.84.mlp.gate",
+ "model.layers.6.input_layernorm",
+ "model.layers.70.mlp.gate",
+ "model.layers.33.post_attention_layernorm",
+ "model.layers.31.self_attn.k_norm",
+ "model.layers.88.self_attn.q_proj.bias",
+ "model.layers.80.self_attn.k_norm",
+ "model.layers.36.mlp.gate.e_score_correction_bias",
+ "model.layers.56.self_attn.v_proj.bias",
+ "model.layers.1.self_attn.k_proj.bias",
+ "model.layers.44.self_attn.k_norm",
+ "model.layers.60.mlp.gate.e_score_correction_bias",
+ "model.layers.32.self_attn.k_proj.bias",
+ "model.layers.69.self_attn.k_proj.bias",
+ "model.layers.4.input_layernorm",
+ "model.layers.15.self_attn.q_norm",
+ "model.layers.79.self_attn.k_norm",
+ "model.layers.4.self_attn.q_proj.bias",
+ "model.layers.51.mlp.gate.e_score_correction_bias",
+ "model.layers.57.self_attn.k_norm",
+ "model.layers.90.self_attn.k_norm",
+ "model.layers.27.self_attn.k_norm",
+ "model.layers.50.post_attention_layernorm",
+ "model.layers.21.self_attn.q_proj.bias",
+ "model.layers.10.input_layernorm",
+ "model.layers.64.self_attn.q_norm",
+ "model.layers.67.self_attn.k_proj.bias",
+ "model.layers.85.self_attn.v_proj.bias",
+ "model.layers.14.mlp.gate.e_score_correction_bias",
+ "model.layers.32.mlp.gate",
+ "model.layers.67.self_attn.v_proj.bias",
+ "model.layers.26.self_attn.k_norm",
+ "model.layers.19.self_attn.q_norm",
+ "model.layers.22.mlp.gate.e_score_correction_bias",
+ "model.layers.68.self_attn.q_norm",
+ "model.layers.86.mlp.gate.e_score_correction_bias",
+ "model.layers.20.post_attention_layernorm",
+ "model.layers.21.post_attention_layernorm",
+ "model.layers.49.self_attn.v_proj.bias",
+ "model.layers.38.mlp.gate",
+ "model.layers.82.self_attn.v_proj.bias",
+ "model.layers.42.mlp.gate",
+ "model.layers.21.input_layernorm",
+ "model.layers.22.self_attn.k_proj.bias",
+ "model.layers.54.self_attn.q_proj.bias",
+ "model.layers.76.post_attention_layernorm",
+ "model.layers.67.input_layernorm",
+ "model.layers.65.self_attn.v_proj.bias",
+ "model.layers.67.self_attn.q_norm",
+ "model.layers.79.self_attn.q_norm",
+ "model.layers.47.input_layernorm",
+ "model.layers.79.mlp.gate.e_score_correction_bias",
+ "model.layers.76.self_attn.k_norm",
+ "model.layers.60.mlp.gate",
+ "model.layers.20.self_attn.q_proj.bias",
+ "model.layers.11.post_attention_layernorm",
+ "model.layers.24.self_attn.q_norm",
+ "model.layers.53.self_attn.k_norm",
+ "model.layers.53.self_attn.q_proj.bias",
+ "model.layers.75.self_attn.k_norm",
+ "model.layers.28.self_attn.q_proj.bias",
+ "model.layers.65.self_attn.q_norm",
+ "model.layers.39.self_attn.k_proj.bias",
+ "model.layers.85.input_layernorm",
+ "model.layers.17.self_attn.q_proj.bias",
+ "model.layers.65.post_attention_layernorm",
+ "model.layers.68.mlp.gate",
+ "model.layers.13.self_attn.q_norm",
+ "model.layers.81.self_attn.v_proj.bias",
+ "model.layers.58.self_attn.q_norm",
+ "model.layers.34.input_layernorm",
+ "model.layers.25.self_attn.q_proj.bias",
+ "model.layers.77.self_attn.k_proj.bias",
+ "model.layers.39.mlp.gate.e_score_correction_bias",
+ "model.layers.0.input_layernorm",
+ "model.layers.76.self_attn.v_proj.bias",
+ "model.layers.6.self_attn.k_norm",
+ "model.layers.74.self_attn.k_proj.bias",
+ "model.layers.92.self_attn.k_norm",
+ "model.layers.37.self_attn.k_proj.bias",
+ "model.layers.18.self_attn.k_norm",
+ "model.layers.48.self_attn.q_norm",
+ "model.layers.84.self_attn.v_proj.bias",
+ "model.layers.47.mlp.gate.e_score_correction_bias",
+ "model.layers.49.self_attn.q_norm",
+ "model.layers.51.self_attn.v_proj.bias",
+ "model.layers.61.input_layernorm",
+ "model.layers.28.self_attn.k_norm",
+ "model.layers.32.self_attn.v_proj.bias",
+ "model.layers.55.self_attn.q_norm",
+ "model.layers.55.self_attn.k_proj.bias",
+ "model.layers.47.post_attention_layernorm",
+ "model.layers.69.self_attn.q_proj.bias",
+ "model.layers.28.input_layernorm",
+ "model.layers.40.self_attn.v_proj.bias",
+ "model.layers.19.input_layernorm",
+ "model.layers.83.self_attn.q_proj.bias",
+ "model.layers.66.self_attn.v_proj.bias",
+ "model.layers.59.mlp.gate.e_score_correction_bias",
+ "model.layers.23.self_attn.v_proj.bias",
+ "model.layers.0.self_attn.q_norm",
+ "model.layers.5.mlp.gate.e_score_correction_bias",
+ "model.layers.37.self_attn.v_proj.bias",
+ "model.layers.2.post_attention_layernorm",
+ "model.layers.5.self_attn.v_proj.bias",
+ "model.layers.34.self_attn.k_proj.bias",
+ "model.layers.38.self_attn.v_proj.bias",
+ "model.layers.81.self_attn.k_norm",
+ "model.layers.32.input_layernorm",
+ "model.layers.10.self_attn.k_norm",
+ "model.layers.54.self_attn.k_norm",
+ "model.layers.70.input_layernorm",
+ "model.layers.41.self_attn.v_proj.bias",
+ "model.layers.74.post_attention_layernorm",
+ "model.layers.35.input_layernorm",
+ "model.layers.7.mlp.gate.e_score_correction_bias",
+ "model.layers.6.post_attention_layernorm",
+ "model.layers.86.mlp.gate",
+ "model.layers.20.mlp.gate",
+ "model.layers.31.mlp.gate",
+ "model.layers.2.self_attn.q_norm",
+ "model.layers.23.self_attn.q_norm",
+ "model.layers.6.self_attn.q_proj.bias",
+ "model.layers.83.self_attn.k_norm",
+ "model.layers.38.input_layernorm",
+ "model.layers.60.self_attn.q_norm",
+ "model.layers.91.self_attn.q_norm",
+ "model.layers.44.input_layernorm",
+ "model.layers.67.post_attention_layernorm",
+ "model.layers.27.self_attn.v_proj.bias",
+ "model.layers.15.input_layernorm",
+ "model.layers.26.self_attn.v_proj.bias",
+ "model.layers.44.post_attention_layernorm",
+ "model.layers.46.self_attn.q_norm",
+ "model.layers.58.self_attn.v_proj.bias",
+ "model.layers.67.self_attn.k_norm",
+ "model.layers.38.self_attn.k_norm",
+ "model.layers.56.mlp.gate.e_score_correction_bias",
+ "model.layers.73.self_attn.k_norm",
+ "model.layers.80.mlp.gate.e_score_correction_bias",
+ "model.layers.37.self_attn.q_proj.bias",
+ "model.layers.17.mlp.gate",
+ "model.layers.19.self_attn.k_norm",
+ "model.layers.53.mlp.gate",
+ "model.layers.21.self_attn.k_proj.bias",
+ "model.layers.56.self_attn.q_norm",
+ "model.layers.59.self_attn.v_proj.bias",
+ "model.layers.64.mlp.gate.e_score_correction_bias",
+ "model.layers.86.self_attn.q_proj.bias",
+ "model.layers.46.input_layernorm",
+ "model.layers.6.mlp.gate",
+ "model.layers.40.self_attn.k_proj.bias",
+ "model.layers.60.self_attn.q_proj.bias",
+ "model.layers.6.self_attn.v_proj.bias",
+ "model.layers.47.mlp.gate",
+ "model.layers.32.self_attn.q_proj.bias",
+ "model.layers.17.mlp.gate.e_score_correction_bias",
+ "model.layers.29.self_attn.k_proj.bias",
+ "model.layers.44.mlp.gate.e_score_correction_bias",
+ "model.layers.57.mlp.gate.e_score_correction_bias",
+ "model.layers.87.self_attn.q_norm",
+ "model.layers.71.self_attn.q_norm",
+ "model.layers.52.self_attn.k_proj.bias",
+ "model.layers.88.mlp.gate.e_score_correction_bias",
+ "model.layers.68.self_attn.k_proj.bias",
+ "model.layers.16.self_attn.q_proj.bias",
+ "model.layers.48.self_attn.v_proj.bias",
+ "model.layers.74.self_attn.q_norm",
+ "model.layers.34.self_attn.q_proj.bias",
+ "model.layers.1.self_attn.q_norm",
+ "model.layers.63.mlp.gate",
+ "model.layers.92.enorm",
+ "model.layers.14.self_attn.v_proj.bias",
+ "model.layers.54.post_attention_layernorm",
+ "model.layers.41.self_attn.q_norm",
+ "model.layers.37.post_attention_layernorm",
+ "model.layers.61.self_attn.q_proj.bias",
+ "model.layers.91.input_layernorm",
+ "model.layers.11.self_attn.k_norm",
+ "model.layers.43.self_attn.q_proj.bias",
+ "model.layers.18.mlp.gate.e_score_correction_bias",
+ "model.layers.59.post_attention_layernorm",
+ "model.layers.9.self_attn.q_norm",
+ "model.layers.74.self_attn.k_norm",
+ "model.layers.43.self_attn.v_proj.bias",
+ "model.layers.49.self_attn.k_proj.bias",
+ "model.layers.56.self_attn.k_proj.bias",
+ "model.layers.14.self_attn.k_proj.bias",
+ "model.layers.65.mlp.gate",
+ "model.layers.56.self_attn.q_proj.bias",
+ "model.layers.24.self_attn.q_proj.bias",
+ "model.layers.71.self_attn.v_proj.bias",
+ "model.layers.54.mlp.gate.e_score_correction_bias",
+ "model.layers.39.post_attention_layernorm",
+ "model.layers.91.self_attn.q_proj.bias",
+ "model.layers.92.mlp.gate.e_score_correction_bias",
+ "model.layers.46.post_attention_layernorm",
+ "model.layers.92.self_attn.v_proj.bias",
+ "model.layers.63.self_attn.v_proj.bias",
+ "model.layers.25.post_attention_layernorm",
+ "model.layers.45.self_attn.q_proj.bias",
+ "model.layers.38.self_attn.q_norm",
+ "model.layers.68.self_attn.v_proj.bias",
+ "model.layers.69.mlp.gate",
+ "model.layers.84.self_attn.k_norm",
+ "model.layers.19.self_attn.q_proj.bias",
+ "model.layers.38.post_attention_layernorm",
+ "model.layers.44.mlp.gate",
+ "model.layers.70.post_attention_layernorm",
+ "model.layers.58.mlp.gate.e_score_correction_bias",
+ "model.layers.28.mlp.gate.e_score_correction_bias",
+ "model.layers.48.post_attention_layernorm",
+ "model.layers.36.self_attn.q_proj.bias",
+ "model.layers.66.self_attn.q_norm",
+ "model.layers.70.self_attn.k_proj.bias",
+ "model.layers.57.input_layernorm",
+ "model.layers.42.self_attn.q_proj.bias",
+ "model.layers.26.mlp.gate",
+ "model.layers.74.self_attn.v_proj.bias",
+ "model.layers.59.self_attn.k_proj.bias",
+ "model.layers.88.mlp.gate",
+ "model.layers.14.self_attn.k_norm",
+ "model.layers.88.self_attn.k_proj.bias",
+ "model.layers.35.self_attn.q_proj.bias",
+ "model.layers.65.self_attn.k_proj.bias",
+ "model.layers.18.self_attn.q_proj.bias",
+ "model.layers.30.self_attn.q_proj.bias",
+ "model.layers.29.self_attn.q_norm",
+ "model.layers.78.post_attention_layernorm",
+ "model.layers.79.mlp.gate",
+ "model.layers.27.post_attention_layernorm",
+ "model.layers.80.self_attn.v_proj.bias",
+ "model.layers.16.mlp.gate",
+ "model.layers.10.self_attn.v_proj.bias",
+ "model.layers.13.self_attn.v_proj.bias",
+ "model.layers.70.self_attn.q_norm",
+ "model.layers.73.mlp.gate.e_score_correction_bias",
+ "model.layers.41.post_attention_layernorm",
+ "model.layers.39.self_attn.k_norm",
+ "model.layers.10.mlp.gate",
+ "model.layers.36.mlp.gate",
+ "model.layers.92.post_attention_layernorm",
+ "model.layers.64.mlp.gate",
+ "model.layers.40.input_layernorm",
+ "model.layers.77.self_attn.k_norm",
+ "model.layers.31.post_attention_layernorm",
+ "model.layers.56.mlp.gate",
+ "model.layers.16.self_attn.v_proj.bias",
+ "model.layers.9.self_attn.q_proj.bias",
+ "model.layers.13.mlp.gate",
+ "model.layers.17.self_attn.k_norm",
+ "model.layers.22.self_attn.q_proj.bias",
+ "model.layers.49.mlp.gate.e_score_correction_bias",
+ "model.layers.9.self_attn.k_proj.bias",
+ "model.layers.37.mlp.gate",
+ "model.layers.72.mlp.gate.e_score_correction_bias",
+ "model.layers.90.self_attn.q_norm",
+ "model.layers.79.self_attn.q_proj.bias",
+ "model.layers.75.mlp.gate",
+ "model.layers.74.mlp.gate.e_score_correction_bias",
+ "model.layers.89.self_attn.v_proj.bias",
+ "model.layers.59.self_attn.k_norm",
+ "model.layers.76.input_layernorm",
+ "model.layers.66.mlp.gate",
+ "model.layers.55.post_attention_layernorm",
+ "model.layers.24.input_layernorm",
+ "model.layers.57.post_attention_layernorm",
+ "model.layers.23.input_layernorm",
+ "model.layers.67.mlp.gate",
+ "model.layers.13.self_attn.k_proj.bias",
+ "model.layers.69.self_attn.v_proj.bias",
+ "model.layers.85.post_attention_layernorm",
+ "model.layers.13.self_attn.q_proj.bias",
+ "model.layers.87.self_attn.k_norm",
+ "model.layers.89.self_attn.k_norm",
+ "model.layers.54.self_attn.k_proj.bias",
+ "model.layers.49.input_layernorm",
+ "model.layers.78.self_attn.q_proj.bias",
+ "model.layers.81.self_attn.q_norm",
+ "model.layers.41.input_layernorm",
+ "model.layers.90.mlp.gate",
+ "model.layers.61.self_attn.k_norm",
+ "model.layers.20.input_layernorm"
+ ],
+ "quant_method": "compressed-tensors",
+ "quantization_status": "compressed"
+ }
+}
diff --git a/generation_config.json b/generation_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..55942563772385555a04b7be7ce33240c1c2d15e
--- /dev/null
+++ b/generation_config.json
@@ -0,0 +1,11 @@
+{
+ "_from_model_config": true,
+ "eos_token_id": [
+ 151329,
+ 151336,
+ 151338
+ ],
+ "temperature": 1.0,
+ "pad_token_id": 151329,
+ "transformers_version": "4.54.0"
+}
diff --git a/model-00001-of-00092.safetensors b/model-00001-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..eef362e533b32930bbb8d08044d32651362f0085
--- /dev/null
+++ b/model-00001-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b36a87481f296d0aa98385f964b7e39ba8b6b3de8d9233484a514b35062dbfec
+size 1877199832
diff --git a/model-00002-of-00092.safetensors b/model-00002-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7d55fbe645f73bc7608d21922c8d275b2e4c455c
--- /dev/null
+++ b/model-00002-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e4377353c9df8c7180bf0d4d876d0a567953a42388771ef110ae144392769555
+size 325307176
diff --git a/model-00003-of-00092.safetensors b/model-00003-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1a520a23fba5eb97e4511133027d8b3c0c2383cb
--- /dev/null
+++ b/model-00003-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:894d603e1bace165a158dfed52240a079b9261bfb5f727248c0387a6f7e3393f
+size 325307176
diff --git a/model-00004-of-00092.safetensors b/model-00004-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9ced60dc38069a7ebe064e489ece8c4fffdc2dab
--- /dev/null
+++ b/model-00004-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1cd3fbef0cdd05105dfdd460578e67127b80dd79d151e1595ea0e156548e7e96
+size 3941945016
diff --git a/model-00005-of-00092.safetensors b/model-00005-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7e67f14b903088457c2d8aba709d981f2d2e232e
--- /dev/null
+++ b/model-00005-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:52cf9b585c448ef051051449f0298fbcbc564b0cd07477a6f81877105600fbac
+size 3941945016
diff --git a/model-00006-of-00092.safetensors b/model-00006-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0f272d206a902c6091dac4417b5176577dab994d
--- /dev/null
+++ b/model-00006-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e42ba13d58a14833a5663ea6308de626e7ed2fce0112137a02c2aafa3618a17
+size 3941945016
diff --git a/model-00007-of-00092.safetensors b/model-00007-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3b54775853a1e94cd34f299ac855c4be2ed712e8
--- /dev/null
+++ b/model-00007-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e18797a56cafdaa6af79ed015aeea3b0aaf64f81f502fe8e86b3350970cd7b91
+size 3941945016
diff --git a/model-00008-of-00092.safetensors b/model-00008-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..14788b8aeabab277a400b54bfa5dc81cd99f56f3
--- /dev/null
+++ b/model-00008-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e9f10b8d1ca2a14385fc68c0e3a3afa3c92e7257b97f4b65f541e02a99ceee2
+size 3941945016
diff --git a/model-00009-of-00092.safetensors b/model-00009-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..583d823b8d839570bcd7041852bc3a30c26b6791
--- /dev/null
+++ b/model-00009-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7641b05d5a04c9de73e2e2ed3c644c7c8359b5049f219b17c6b50df597cd41b8
+size 3941945016
diff --git a/model-00010-of-00092.safetensors b/model-00010-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5625e80fd94575acacbc952944a347daf15bc80a
--- /dev/null
+++ b/model-00010-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b11e1b5061ad41b414303c354edf6f9eb1306f9766fff524a4042f37843dd7ab
+size 3941945016
diff --git a/model-00011-of-00092.safetensors b/model-00011-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..db103deb6609efe716c53fb97628ba9df402758d
--- /dev/null
+++ b/model-00011-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a0ff0e88b6ee8e4a063826b874ddcd2a8ac6554656819163d5b61aa36831ccb2
+size 3941946000
diff --git a/model-00012-of-00092.safetensors b/model-00012-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9a712d9c99dd3fc373b2bb1e8bc551c29bf6a1fc
--- /dev/null
+++ b/model-00012-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6466a2807bf05f0ad9692594253f616562b34a89ab4d6996defa21835c447647
+size 3941946000
diff --git a/model-00013-of-00092.safetensors b/model-00013-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3d3f660df54da9460a7f2c5f218a400ea3738d17
--- /dev/null
+++ b/model-00013-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:75ddfa9e346c02cf9aff2067f0110ba70e59cfc475afdee6e900474d9b73f99e
+size 3941946000
diff --git a/model-00014-of-00092.safetensors b/model-00014-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6d9220876ec9bc59eec7c5717c2e2a251df1f850
--- /dev/null
+++ b/model-00014-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c7dca430e5679422b738125a160d5d484ba55b32db28e2887f85a6cfbcf6b7a
+size 3941946000
diff --git a/model-00015-of-00092.safetensors b/model-00015-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..90b7d1e2ed81867ca40bf33eb63ba8fcdb25af1a
--- /dev/null
+++ b/model-00015-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:249f98f6d42b67d699c2d244b5df000796e4432bd843f26ab39640597e49686e
+size 3941946000
diff --git a/model-00016-of-00092.safetensors b/model-00016-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a6b662b48ef5c3f6f64b72f251dbebbc8d6e2e67
--- /dev/null
+++ b/model-00016-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b66acc87692b8d8c794ff8fda0e0a2217ef7c9306daa5a90e97b77bdeac24b9c
+size 3941946000
diff --git a/model-00017-of-00092.safetensors b/model-00017-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..dcbec98bf209efeba4a545c8c4231ef2d087488d
--- /dev/null
+++ b/model-00017-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:361fa81c2ff26252d66f2938de1f0ff91046dffda8a5e85afe2550498e00df01
+size 3941946000
diff --git a/model-00018-of-00092.safetensors b/model-00018-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7ce031126daf4009f6b0f044306bac7a4fcaf844
--- /dev/null
+++ b/model-00018-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d5cf1c834832cae1a0a6800e87621091b57dc6641b57ebc8e75b2e99ab29f9e7
+size 3941946000
diff --git a/model-00019-of-00092.safetensors b/model-00019-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f37a91370e0fe93a46e6bd345c971363e0de1baf
--- /dev/null
+++ b/model-00019-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7fd9d4ea2442838e9911e506233df72589841f81f849b7813e40c770e46ffb37
+size 3941946000
diff --git a/model-00020-of-00092.safetensors b/model-00020-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ae7068a02a311bd8ffd7fae04d1f36f2e0be164c
--- /dev/null
+++ b/model-00020-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:805da56848f53fe8ba7b1d4766041176b07050bb2d06636354179420a3ef7a53
+size 3941946000
diff --git a/model-00021-of-00092.safetensors b/model-00021-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4c26079064a6e0e8e4b4ed1a0299e8420e8d5d29
--- /dev/null
+++ b/model-00021-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e70481fdbbb4b013e248a3978635db8149391cba0977b0af00f431bdf368a78b
+size 3941946000
diff --git a/model-00022-of-00092.safetensors b/model-00022-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9c584190e218a5a6877b8b51782929681b5f085e
--- /dev/null
+++ b/model-00022-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:522a46ea7d953e8bac1a7ef71ef87d08559cce9181600f59363b4a03a37978ba
+size 3941946000
diff --git a/model-00023-of-00092.safetensors b/model-00023-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..dc810bc8267a36fb06371654cf4d055adb7dae2a
--- /dev/null
+++ b/model-00023-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4828ab751880a84b595764ad30da807ae4bfc7d6cd5060a467a5d4ee7c0472f9
+size 3941946000
diff --git a/model-00024-of-00092.safetensors b/model-00024-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f7536210e2e75896a3c7c9883939bc57b9327e01
--- /dev/null
+++ b/model-00024-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd37f2bd39696f2879e47ee28775f25cb316189f31487c4820ec758ed3eb07e9
+size 3941946000
diff --git a/model-00025-of-00092.safetensors b/model-00025-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9869108a62c79e1bfa4b01738ec17c2814760862
--- /dev/null
+++ b/model-00025-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:499cccb499dfe2a7c38413373b9ef4f7aeafcc3adb5273c993b51ecdf66a1af4
+size 3941946000
diff --git a/model-00026-of-00092.safetensors b/model-00026-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c36c81de5ceb4cd68616c6d4a2dc834332d25382
--- /dev/null
+++ b/model-00026-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f74964374efe4e3ebbe44e6c664cfd5e69315ef16479c4fb69ec21494406647f
+size 3941946000
diff --git a/model-00027-of-00092.safetensors b/model-00027-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7538bad9a24f7ecdb6c2bf50fdb8fb55a5411d9e
--- /dev/null
+++ b/model-00027-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f386ccd96a1e9269912c11da13474929ef51a642451017cf71df0403183e3d46
+size 3941946000
diff --git a/model-00028-of-00092.safetensors b/model-00028-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..47b5c4395e90bdc3bfca65b0426e42c419665266
--- /dev/null
+++ b/model-00028-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9607d17b25225d77768fe976e412ac22e58b06ea7e5fedb41c0fb1e7c024aa3
+size 3941946000
diff --git a/model-00029-of-00092.safetensors b/model-00029-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ade71e46e55a0a07e5c779c1033d5b23d0aca560
--- /dev/null
+++ b/model-00029-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:90818dcdcef479199d3884e549597ca85eb1459fffb8d3ca1490df655062749e
+size 3941946000
diff --git a/model-00030-of-00092.safetensors b/model-00030-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d53b3951f701cf9faca6d364eb2071bcda593265
--- /dev/null
+++ b/model-00030-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7f5c95e0c676d2e61ca2c2a64a1f93fec730b9e72595d62f341ab69669f4afe6
+size 3941946000
diff --git a/model-00031-of-00092.safetensors b/model-00031-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..75192b3e8191f540d6ac328d4b892f812d394201
--- /dev/null
+++ b/model-00031-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7262032f0ae419b7281c7fe00cdb32da11d1851e25552a0c72426131a195f6a
+size 3941946000
diff --git a/model-00032-of-00092.safetensors b/model-00032-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f00a028b94f4c36db1efbd8fb34ad53657de6032
--- /dev/null
+++ b/model-00032-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d599db91bc26fc7f51e6313ad71eef3e17d9306c70384520caab9a0f3e69d8d3
+size 3941946000
diff --git a/model-00033-of-00092.safetensors b/model-00033-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9f79aaa4cf6250765ca22914e98b355be3b347ab
--- /dev/null
+++ b/model-00033-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ce02e0c5758d470bb953091aa074414532bbf094ff987c094731ed72de1d178
+size 3941946000
diff --git a/model-00034-of-00092.safetensors b/model-00034-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cd497c959da5f6c0bebb59c6a6cf32789f6496fc
--- /dev/null
+++ b/model-00034-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d26dbb8145811b8312bd1326e99534957c0cb8f14749b468afb526493c54fd4f
+size 3941946000
diff --git a/model-00035-of-00092.safetensors b/model-00035-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..91e0f64487b5ce2f0ac5182c59c9abaa775955e4
--- /dev/null
+++ b/model-00035-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e2b95a853acc68338bdc9a25b8a06e95ae9eebe85c95739a6225e81e93d837dd
+size 3941946000
diff --git a/model-00036-of-00092.safetensors b/model-00036-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c204754b52237f215a2613ca9287eaf6db874644
--- /dev/null
+++ b/model-00036-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ea306c5fb06b73cc99ca0c1a0243047c78c5637d49908d98989fc80adef7623
+size 3941946000
diff --git a/model-00037-of-00092.safetensors b/model-00037-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..975ce023899126031190da13a215d9112eacb06b
--- /dev/null
+++ b/model-00037-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d172e2be799fb9207cfcd35790d5c827ae65cd631432c479b395a4da52c0d27
+size 3941946000
diff --git a/model-00038-of-00092.safetensors b/model-00038-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..046435caafe51a3731a1abae53295842037b44d1
--- /dev/null
+++ b/model-00038-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:97a20ab8c68afaaf94307353b8115d39be316c2aa1f71433d7cb134a2c598b85
+size 3941946000
diff --git a/model-00039-of-00092.safetensors b/model-00039-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..53134b127ae13cc8f03dde1474950819aadaf10e
--- /dev/null
+++ b/model-00039-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8220c62ba76eaa513af60b1cab88303e7d2dda98af483cb603279e2ecf2474d0
+size 3941946000
diff --git a/model-00040-of-00092.safetensors b/model-00040-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9840abe05e5b5388455c3f173d9031c2cf3c1b32
--- /dev/null
+++ b/model-00040-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d977ba19ca442fe854b40ecdf24587241d36f6aa98828bc33e2d1415959b7594
+size 3941946000
diff --git a/model-00041-of-00092.safetensors b/model-00041-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a766971186b9224cac0cb521fd8af7ab17caaa85
--- /dev/null
+++ b/model-00041-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b3a0fb8ea2b84f942e0de29c7a815d03b984758c008c019839578a37dce2c011
+size 3941946000
diff --git a/model-00042-of-00092.safetensors b/model-00042-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d367ccdbede8478e9759a8424765aff0165be18a
--- /dev/null
+++ b/model-00042-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8b5982626470e66a5e3675bf24409bcc6044dafcb9f8ed055b9232252547cee3
+size 3941946000
diff --git a/model-00043-of-00092.safetensors b/model-00043-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..02198e10ba7af68ac6ef1e4823ba82f92c148a89
--- /dev/null
+++ b/model-00043-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37ec7e24ee7307a7beb1a186fd2f3505bc3deb955748990acbb0fea2f2cf82fd
+size 3941946000
diff --git a/model-00044-of-00092.safetensors b/model-00044-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..062e8f482e738a1570f5dee7484deee22251a0c3
--- /dev/null
+++ b/model-00044-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eec5e6b73a6c0df1f1575154a3e3ed7666adf33803267c30faae7550faa33b68
+size 3941946000
diff --git a/model-00045-of-00092.safetensors b/model-00045-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e46b5bd75a77f0f08ba438d9066721768a7e2089
--- /dev/null
+++ b/model-00045-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8dcd5b45b868f6993d03f3b5664f031937ecbb08d5a9a38b3daf72aab839f361
+size 3941946000
diff --git a/model-00046-of-00092.safetensors b/model-00046-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e1006cea1a552625019cd625446e07e860f45e46
--- /dev/null
+++ b/model-00046-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32fe9214b2e51fc57c6bc180a2f7c90ab949135b8b52e9f926e6abdff6b44e8f
+size 3941946000
diff --git a/model-00047-of-00092.safetensors b/model-00047-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6499d58ae0c98dad7ae869a7077abfb4537ac92a
--- /dev/null
+++ b/model-00047-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07957a95e73bc5c357b31e681b086413417fef3db448596b83a50369e67ca6b2
+size 3941946000
diff --git a/model-00048-of-00092.safetensors b/model-00048-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..27b70720d23867788abfe15e3fc36b9697021e75
--- /dev/null
+++ b/model-00048-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c57f1f78fd768a7956c373bcf5a41616e8d01c5358dc8bad51a6477b85a4ec85
+size 3941946000
diff --git a/model-00049-of-00092.safetensors b/model-00049-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..76adf7543484a2db4151eeee9081f67b2fd326ee
--- /dev/null
+++ b/model-00049-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86c27727d56f395d7348a0b202d454d40661d1dd1125eebbf37eab1d09f409da
+size 3941946000
diff --git a/model-00050-of-00092.safetensors b/model-00050-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cf6bc4219363711581895006a329eb9b3763370a
--- /dev/null
+++ b/model-00050-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:687cb273bfeff95fd54f89dbde8cf5a4d8245454ccbab89f09835eb57e82ac61
+size 3941946000
diff --git a/model-00051-of-00092.safetensors b/model-00051-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2219eca3232790f1624cf14c1dad896327412da7
--- /dev/null
+++ b/model-00051-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c3a7a42e6a6f8fa0eb882ca3161c50f7692cac44dbf1e523d8e93152df634a95
+size 3941946000
diff --git a/model-00052-of-00092.safetensors b/model-00052-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b2e366fc4fdd3d41a74f1af71d7bee870e118772
--- /dev/null
+++ b/model-00052-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:23906dc240eee83293d676f597efabeb73b9b2be898bda70603fbd390f9220bf
+size 3941946000
diff --git a/model-00053-of-00092.safetensors b/model-00053-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e3a393f3474220ac09ad0317047c55a47e2d447a
--- /dev/null
+++ b/model-00053-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be920cf049b968c844e7a6e0266218eaee1cd8bc612cf4d9972629c04add882a
+size 3941946000
diff --git a/model-00054-of-00092.safetensors b/model-00054-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..060691c43acf4c4f35e24af5f31079d459e54fd4
--- /dev/null
+++ b/model-00054-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25dcab199ede5099063a4a211374952e15e95f864988f93cea999e1ac1be1825
+size 3941946000
diff --git a/model-00055-of-00092.safetensors b/model-00055-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e896c37c15b1cbd746a4690651bf8668e1b2d67b
--- /dev/null
+++ b/model-00055-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:57c62fba715fb7373078f697eabda5c22a28a028f9a7b157d0eab44b6a2982dd
+size 3941946000
diff --git a/model-00056-of-00092.safetensors b/model-00056-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f64bbd248d522fde98462b30d94e8777cc40754a
--- /dev/null
+++ b/model-00056-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0d8e2336a5b79acae36c8bc2fd8245b648e402c7c0a9fd27a9ad1cdcdc55e35
+size 3941946000
diff --git a/model-00057-of-00092.safetensors b/model-00057-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e5651787cd4810c2656d60a30e11b9370d251815
--- /dev/null
+++ b/model-00057-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c928a35b63210c92caba603462aac155c988c2887814dfbaafb8507c4432bab
+size 3941946000
diff --git a/model-00058-of-00092.safetensors b/model-00058-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a0042af51f7443161d3c2273c15ab201cb1e19f0
--- /dev/null
+++ b/model-00058-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:39abd3b08f1247e0c59ed096e41c328141831cd297e261c4f2f6d4d15605be04
+size 3941946000
diff --git a/model-00059-of-00092.safetensors b/model-00059-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bd068233148883fd67c4b923c8321662215bc2db
--- /dev/null
+++ b/model-00059-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ee449fec8018e00c728e353ea91f4f6749645adafb621e85a3da98f18aa48b39
+size 3941946000
diff --git a/model-00060-of-00092.safetensors b/model-00060-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fa52da9fc6284eb301efa35dd1077abbcfb1aab4
--- /dev/null
+++ b/model-00060-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6cca12f50b985b8d566372a98a895432e66e889cd4997f37165d3aa3ad7927b9
+size 3941946000
diff --git a/model-00061-of-00092.safetensors b/model-00061-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b6221293eafebcd316b054fcb0b2266c92595ede
--- /dev/null
+++ b/model-00061-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:178e31d637b5d67e18deacac90eac7c19e2ed0381ba18967665740f979797e19
+size 3941946000
diff --git a/model-00062-of-00092.safetensors b/model-00062-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cebca0fa0c05007dc868347fb0ffd749fbf8c13a
--- /dev/null
+++ b/model-00062-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfd0f735b8e608a48af211b8e17836ce7b81ce91c69dd20653c71882b129f902
+size 3941946000
diff --git a/model-00063-of-00092.safetensors b/model-00063-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..23e4df9a33c13767a6ec418def44202035cba526
--- /dev/null
+++ b/model-00063-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f79b931f9901303c4eaa2f142631375731428e685298d731d9e96b450c9579d
+size 3941946000
diff --git a/model-00064-of-00092.safetensors b/model-00064-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9b081e774cc85cfbc438145dae36a566d85fbe84
--- /dev/null
+++ b/model-00064-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e7154a05437423b6a1820c7cffb130ceb2a5a9b2b99ab0c868a38bb3bb8eb1f
+size 3941946000
diff --git a/model-00065-of-00092.safetensors b/model-00065-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a3f2d429b3f5066d674167c4732e0905462fffbf
--- /dev/null
+++ b/model-00065-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b981b155390b43bd39b2a5e3e568c1991b8d85c5966700fd2e77609af2817bd
+size 3941946000
diff --git a/model-00066-of-00092.safetensors b/model-00066-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1bffedee3763192b750cae595c75962ab1e589d1
--- /dev/null
+++ b/model-00066-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e5fa0a4798c9c173142b82589a5fc21208a54f81caa5464d52d4dc919839e35
+size 3941946000
diff --git a/model-00067-of-00092.safetensors b/model-00067-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8b6aaaa00e0d815ed997173205f50e455461fca1
--- /dev/null
+++ b/model-00067-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7642e77c5b79fd69a1b3a702752cc49a9b9e6c0742615a7dffae32485bccf8dc
+size 3941946000
diff --git a/model-00068-of-00092.safetensors b/model-00068-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..06da087afff80bb4c47db304a95a6925e03da944
--- /dev/null
+++ b/model-00068-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2acab87829de540864f267c0c460ad2dd3bf4de8c6193336d803c69e68c0e118
+size 3941946000
diff --git a/model-00069-of-00092.safetensors b/model-00069-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..03f442810bcb21897a9f39b11b02d70adee549d9
--- /dev/null
+++ b/model-00069-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:53ab4c3e7bda5f956fac92d641f4fa0f59ff9eb76b17f6f5784292aa91223459
+size 3941946000
diff --git a/model-00070-of-00092.safetensors b/model-00070-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..565bc1e95f09276ef21c6d99b32d364aaf2677f4
--- /dev/null
+++ b/model-00070-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff7c3e8ac7fc32e94301f5c811f633d1cd7671c581e4afa9e3b71c3ad5900d41
+size 3941946000
diff --git a/model-00071-of-00092.safetensors b/model-00071-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bd260e09780ee7de5bd10e0b5bb6fe5eda517354
--- /dev/null
+++ b/model-00071-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:219f7d0d09cf60950f0afa6bd219801fe9b740d999ae4bcd6b29f8b067bbbe65
+size 3941946000
diff --git a/model-00072-of-00092.safetensors b/model-00072-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..80494ca1116d7b0c82987013b5d0d4539042c408
--- /dev/null
+++ b/model-00072-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e6c90d3e3810dce5d726f3709b5c090972c2760a49179bbaf501e9350d5dfae
+size 3941946000
diff --git a/model-00073-of-00092.safetensors b/model-00073-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..679ab1ed65baa9019ed8e2b6b1c7fa89b91c0185
--- /dev/null
+++ b/model-00073-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69d544b89fbc0c8f641dca9fc57fb69b40b471f9d0af4e8ceebc509b9bd846bf
+size 3941946000
diff --git a/model-00074-of-00092.safetensors b/model-00074-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..665812199c35801b6616ee07508f3ab3063fcbe0
--- /dev/null
+++ b/model-00074-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:085c3296e419064f7aaf27994ce768fb65e670aed0c4de8149203a82bf3b3f95
+size 3941946000
diff --git a/model-00075-of-00092.safetensors b/model-00075-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..36388d8bbdd51c0fae330f4bdf19e8f4b2a399c3
--- /dev/null
+++ b/model-00075-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:532e038f6687377fdc85f8009b4b1b304cc45a9cff49af9dc81e031465a5fe8a
+size 3941946000
diff --git a/model-00076-of-00092.safetensors b/model-00076-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..04011111bcd77aa168a80c4b22a4403dc02eea28
--- /dev/null
+++ b/model-00076-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:595028c19b4c94029a7a64500de9d5127f698a5cd5f0347e0a071db272a35322
+size 3941946000
diff --git a/model-00077-of-00092.safetensors b/model-00077-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..11a35cfbfa4ad6383a928c00a1051c98479cc59a
--- /dev/null
+++ b/model-00077-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4bafd0685064c6855c60bce9bffcf99fb0b29e80b6603492c6c3cac46cdffa1
+size 3941946000
diff --git a/model-00078-of-00092.safetensors b/model-00078-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..37b739ceada56331b028250838ec1aafbcc91701
--- /dev/null
+++ b/model-00078-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be67adfc219969301f298e9fbea60513ec0470971e47fa7c3a6070ed3bdb0956
+size 3941946000
diff --git a/model-00079-of-00092.safetensors b/model-00079-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ac23cb22b66bb24938ded37fe0ca9019c946e17f
--- /dev/null
+++ b/model-00079-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9fb5c4b4465d340d7dacf948dfd8d65c634cb9ec8f754596083365e232babac3
+size 3941946000
diff --git a/model-00080-of-00092.safetensors b/model-00080-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..edc4d51c0e7e2198e8f21943cefbfdd1a009c765
--- /dev/null
+++ b/model-00080-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6810cc361fe280843675844645d0211bca0546a8ef33464d91dd47940205317a
+size 3941946000
diff --git a/model-00081-of-00092.safetensors b/model-00081-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e17cb0fb3ee7a45c35152b0590c86bff180de455
--- /dev/null
+++ b/model-00081-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:593dce45d7e5a6feba3bbc00a928911b6242906b7c934d263d3d66218f5a6159
+size 3941946000
diff --git a/model-00082-of-00092.safetensors b/model-00082-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..971106cc33b860833bdd0fdce22e8ef5641f20e2
--- /dev/null
+++ b/model-00082-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a29714ca5445705fd6ca4609f1775fb31cd3d338abccaf8fd768ccbe0049cbb
+size 3941946000
diff --git a/model-00083-of-00092.safetensors b/model-00083-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4a503262f35e069e222f10e3e1e450c80e70beab
--- /dev/null
+++ b/model-00083-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c62679b47cde1adb854a9de8506b1e62fd4dafc8c029780f8228234fb2dbe8f
+size 3941946000
diff --git a/model-00084-of-00092.safetensors b/model-00084-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fe4c41b438edcf6300f146dc93722d53fe244ae1
--- /dev/null
+++ b/model-00084-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2e73e8c4a224489ba6401ba3420a0dc12a8978acc4a5da3f968c6e8e6169eb0e
+size 3941946000
diff --git a/model-00085-of-00092.safetensors b/model-00085-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c57b2477936e573730f627dae25c87ea34b63b4c
--- /dev/null
+++ b/model-00085-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a8585b73d4ab24e73dbbad803269cd8d8e0eef795ebd66d4f5b40a0c73a782b
+size 3941946000
diff --git a/model-00086-of-00092.safetensors b/model-00086-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4cb5d5c50afd285b3808c4764a0380137e778445
--- /dev/null
+++ b/model-00086-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5111ae197b208badc1ea31c0eaafe8a49e649862015a023e712f500e3ced464a
+size 3941946000
diff --git a/model-00087-of-00092.safetensors b/model-00087-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..efb225cc0719489a22d98cb239cd8612314e8492
--- /dev/null
+++ b/model-00087-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f04c69b8f445d91720f7c389613b3927425fc38be5027af99467029f860cdeb
+size 3941946000
diff --git a/model-00088-of-00092.safetensors b/model-00088-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9a50bb6fae4b25cbf86eafb0100a556e809b4eda
--- /dev/null
+++ b/model-00088-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:922beebb36eafa20e410a37737eee7c6d16d8114d1dd09c4ebccc703d51e9537
+size 3941946000
diff --git a/model-00089-of-00092.safetensors b/model-00089-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4f68571c0463a0e0c57e94aa115dbb64a7355f09
--- /dev/null
+++ b/model-00089-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd76187e5c79aefc3c6fad87a48c7339f6e5960c62328be1a3934f606438e101
+size 3941946000
diff --git a/model-00090-of-00092.safetensors b/model-00090-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cbf33d1baa193a7f269827d36f96df0fda04c448
--- /dev/null
+++ b/model-00090-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2c5c3b7d5798182b92b711177db1abd4805ab646a2450d792d8932cc3cc1330
+size 3941946000
diff --git a/model-00091-of-00092.safetensors b/model-00091-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c63f425d7ec7a84aa32a85777922b0bda1f102b1
--- /dev/null
+++ b/model-00091-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41496ad8b78d3ffa537482a7af105055a83a271e9a10b4364b663362094088be
+size 3941946000
diff --git a/model-00092-of-00092.safetensors b/model-00092-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..59818eb13ea7972581902f077eca5ddf72d486f1
--- /dev/null
+++ b/model-00092-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a3160dfca14b9b6f2d46f7d63228903ebaa890b169e4fe36e77366e35d73985
+size 5493849232
diff --git a/model.safetensors.index.json b/model.safetensors.index.json
new file mode 100644
index 0000000000000000000000000000000000000000..19bba211162e856fdef26980cd437c52050ad693
--- /dev/null
+++ b/model.safetensors.index.json
@@ -0,0 +1,87560 @@
+{
+ "weight_map": {
+ "model.embed_tokens.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.input_layernorm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.down_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.down_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.gate_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.up_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.up_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.o_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.v_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.1.input_layernorm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.down_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.down_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.gate_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.gate_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.up_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.up_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.post_attention_layernorm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_norm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_proj.bias": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.o_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_norm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_proj.bias": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.v_proj.bias": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.v_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.2.input_layernorm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.down_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.down_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.gate_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.gate_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.up_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.up_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.post_attention_layernorm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_norm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_proj.bias": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.o_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.o_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_norm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_proj.bias": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.v_proj.bias": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.v_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.v_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.3.input_layernorm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.gate.e_score_correction_bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.gate.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.post_attention_layernorm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_norm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_proj.bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.o_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.o_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_norm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_proj.bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.v_proj.bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.v_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.v_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.4.input_layernorm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.gate.e_score_correction_bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.gate.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.post_attention_layernorm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_norm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_proj.bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.o_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.o_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_norm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_proj.bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.v_proj.bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.v_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.v_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.5.input_layernorm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.gate.e_score_correction_bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.gate.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.post_attention_layernorm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_norm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_proj.bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.o_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.o_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_norm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_proj.bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.v_proj.bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.v_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.v_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.6.input_layernorm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.gate.e_score_correction_bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.gate.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.post_attention_layernorm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_norm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_proj.bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.o_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.o_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_norm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_proj.bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.v_proj.bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.v_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.v_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.7.input_layernorm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.gate.e_score_correction_bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.gate.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.post_attention_layernorm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_norm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_proj.bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.o_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.o_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_norm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_proj.bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.v_proj.bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.v_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.v_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.8.input_layernorm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.gate.e_score_correction_bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.gate.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.post_attention_layernorm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_norm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_proj.bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.o_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.o_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_norm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_proj.bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.v_proj.bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.v_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.v_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.9.input_layernorm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.gate.e_score_correction_bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.gate.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.post_attention_layernorm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_norm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_proj.bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.o_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.o_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_norm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_proj.bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.v_proj.bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.v_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.v_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.10.input_layernorm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.gate.e_score_correction_bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.gate.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.post_attention_layernorm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_norm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_proj.bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.o_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.o_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_norm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_proj.bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.v_proj.bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.v_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.v_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.11.input_layernorm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.gate.e_score_correction_bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.gate.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.post_attention_layernorm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_norm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_proj.bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.o_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.o_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_norm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_proj.bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.v_proj.bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.v_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.v_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.12.input_layernorm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.gate.e_score_correction_bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.gate.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.post_attention_layernorm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_norm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_proj.bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.o_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.o_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_norm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_proj.bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.v_proj.bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.v_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.v_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.13.input_layernorm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.gate.e_score_correction_bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.gate.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.post_attention_layernorm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_norm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_proj.bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.o_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.o_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_norm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_proj.bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.v_proj.bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.v_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.v_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.14.input_layernorm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.gate.e_score_correction_bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.gate.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.post_attention_layernorm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_norm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_proj.bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.o_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.o_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_norm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_proj.bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.v_proj.bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.v_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.v_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.15.input_layernorm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.gate.e_score_correction_bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.gate.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.post_attention_layernorm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_norm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_proj.bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.o_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.o_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_norm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_proj.bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.v_proj.bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.v_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.v_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.16.input_layernorm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.gate.e_score_correction_bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.gate.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.post_attention_layernorm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_norm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_proj.bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.o_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.o_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_norm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_proj.bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.v_proj.bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.v_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.v_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.17.input_layernorm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.gate.e_score_correction_bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.gate.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.post_attention_layernorm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_norm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_proj.bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.o_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.o_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_norm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_proj.bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.v_proj.bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.v_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.v_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.18.input_layernorm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.gate.e_score_correction_bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.gate.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.post_attention_layernorm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_norm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_proj.bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.o_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.o_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_norm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_proj.bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.v_proj.bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.v_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.v_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.19.input_layernorm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.gate.e_score_correction_bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.gate.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.post_attention_layernorm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_norm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_proj.bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.o_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.o_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_norm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_proj.bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.v_proj.bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.v_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.v_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.20.input_layernorm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.gate.e_score_correction_bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.gate.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.post_attention_layernorm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_norm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_proj.bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.o_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.o_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_norm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_proj.bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.v_proj.bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.v_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.v_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.21.input_layernorm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.gate.e_score_correction_bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.gate.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.post_attention_layernorm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_norm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_proj.bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.o_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.o_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_norm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_proj.bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.v_proj.bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.v_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.v_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.22.input_layernorm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.gate.e_score_correction_bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.gate.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.post_attention_layernorm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_norm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_proj.bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.o_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.o_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_norm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_proj.bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.v_proj.bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.v_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.v_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.23.input_layernorm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.gate.e_score_correction_bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.gate.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.post_attention_layernorm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_norm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_proj.bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.o_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.o_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_norm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_proj.bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.v_proj.bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.v_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.v_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.24.input_layernorm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.gate.e_score_correction_bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.gate.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.post_attention_layernorm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_norm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_proj.bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.o_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.o_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_norm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_proj.bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.v_proj.bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.v_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.v_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.25.input_layernorm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.gate.e_score_correction_bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.gate.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.post_attention_layernorm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_norm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_proj.bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.o_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.o_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_norm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_proj.bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.v_proj.bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.v_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.v_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.26.input_layernorm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.gate.e_score_correction_bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.gate.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.post_attention_layernorm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_norm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_proj.bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.o_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.o_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_norm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_proj.bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.v_proj.bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.v_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.v_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.27.input_layernorm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.gate.e_score_correction_bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.gate.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.post_attention_layernorm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_norm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_proj.bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.o_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.o_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_norm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_proj.bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.v_proj.bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.v_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.v_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.28.input_layernorm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.gate.e_score_correction_bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.gate.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.post_attention_layernorm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_norm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_proj.bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.o_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.o_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_norm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_proj.bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.v_proj.bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.v_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.v_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.29.input_layernorm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.gate.e_score_correction_bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.gate.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.post_attention_layernorm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_norm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_proj.bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.o_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.o_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_norm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_proj.bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.v_proj.bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.v_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.v_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.30.input_layernorm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.gate.e_score_correction_bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.gate.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.post_attention_layernorm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_norm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_proj.bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.o_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.o_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_norm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_proj.bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.v_proj.bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.v_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.v_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.31.input_layernorm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.gate.e_score_correction_bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.gate.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.post_attention_layernorm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_norm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_proj.bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.o_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.o_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_norm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_proj.bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.v_proj.bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.v_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.v_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.32.input_layernorm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.gate.e_score_correction_bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.gate.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.post_attention_layernorm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_norm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_proj.bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.o_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.o_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_norm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_proj.bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.v_proj.bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.v_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.v_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.33.input_layernorm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.gate.e_score_correction_bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.gate.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.post_attention_layernorm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_norm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_proj.bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.o_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.o_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_norm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_proj.bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.v_proj.bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.v_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.v_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.34.input_layernorm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.gate.e_score_correction_bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.gate.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.post_attention_layernorm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_norm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_proj.bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.o_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.o_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_norm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_proj.bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.v_proj.bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.v_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.v_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.35.input_layernorm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.gate.e_score_correction_bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.gate.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.post_attention_layernorm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_norm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_proj.bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.o_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.o_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_norm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_proj.bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.v_proj.bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.v_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.v_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.36.input_layernorm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.gate.e_score_correction_bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.gate.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.post_attention_layernorm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_norm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_proj.bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.o_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.o_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_norm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_proj.bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.v_proj.bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.v_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.v_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.37.input_layernorm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.gate.e_score_correction_bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.gate.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.post_attention_layernorm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_norm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_proj.bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.o_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.o_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_norm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_proj.bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.v_proj.bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.v_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.v_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.38.input_layernorm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.gate.e_score_correction_bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.gate.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.post_attention_layernorm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_norm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_proj.bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.o_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.o_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_norm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_proj.bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.v_proj.bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.v_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.v_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.39.input_layernorm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.gate.e_score_correction_bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.gate.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.post_attention_layernorm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_norm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_proj.bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.o_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.o_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_norm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_proj.bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.v_proj.bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.v_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.v_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.40.input_layernorm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.gate.e_score_correction_bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.gate.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.post_attention_layernorm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_norm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_proj.bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.o_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.o_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_norm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_proj.bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.v_proj.bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.v_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.v_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.41.input_layernorm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.gate.e_score_correction_bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.gate.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.post_attention_layernorm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_norm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_proj.bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.o_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.o_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_norm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_proj.bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.v_proj.bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.v_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.v_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.42.input_layernorm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.gate.e_score_correction_bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.gate.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.post_attention_layernorm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_norm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_proj.bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.o_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.o_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_norm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_proj.bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.v_proj.bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.v_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.v_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.43.input_layernorm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.gate.e_score_correction_bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.gate.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.post_attention_layernorm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_norm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_proj.bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.o_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.o_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_norm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_proj.bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.v_proj.bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.v_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.v_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.44.input_layernorm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.gate.e_score_correction_bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.gate.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.post_attention_layernorm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_norm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_proj.bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.o_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.o_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_norm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_proj.bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.v_proj.bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.v_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.v_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.45.input_layernorm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.gate.e_score_correction_bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.gate.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.post_attention_layernorm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_norm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_proj.bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.o_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.o_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_norm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_proj.bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.v_proj.bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.v_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.v_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.46.input_layernorm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.gate.e_score_correction_bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.gate.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.post_attention_layernorm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_norm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_proj.bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.o_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.o_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_norm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_proj.bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.v_proj.bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.v_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.v_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.47.input_layernorm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.gate.e_score_correction_bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.gate.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.post_attention_layernorm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_norm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_proj.bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.o_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.o_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_norm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_proj.bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.v_proj.bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.v_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.v_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.48.input_layernorm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.gate.e_score_correction_bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.gate.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.post_attention_layernorm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_norm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_proj.bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.o_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.o_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_norm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_proj.bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.v_proj.bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.v_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.v_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.49.input_layernorm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.gate.e_score_correction_bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.gate.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.post_attention_layernorm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_norm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_proj.bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.o_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.o_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_norm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_proj.bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.v_proj.bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.v_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.v_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.50.input_layernorm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.gate.e_score_correction_bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.gate.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.post_attention_layernorm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_norm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_proj.bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.o_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.o_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_norm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_proj.bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.v_proj.bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.v_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.v_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.51.input_layernorm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.gate.e_score_correction_bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.gate.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.post_attention_layernorm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_norm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_proj.bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.o_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.o_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_norm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_proj.bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.v_proj.bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.v_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.v_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.52.input_layernorm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.gate.e_score_correction_bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.gate.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.post_attention_layernorm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_norm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_proj.bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.o_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.o_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_norm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_proj.bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.v_proj.bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.v_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.v_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.53.input_layernorm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.gate.e_score_correction_bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.gate.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.post_attention_layernorm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_norm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_proj.bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.o_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.o_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_norm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_proj.bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.v_proj.bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.v_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.v_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.54.input_layernorm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.gate.e_score_correction_bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.gate.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.post_attention_layernorm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_norm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_proj.bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.o_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.o_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_norm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_proj.bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.v_proj.bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.v_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.v_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.55.input_layernorm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.gate.e_score_correction_bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.gate.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.post_attention_layernorm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_norm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_proj.bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.o_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.o_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_norm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_proj.bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.v_proj.bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.v_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.v_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.56.input_layernorm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.gate.e_score_correction_bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.gate.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.post_attention_layernorm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_norm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_proj.bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.o_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.o_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_norm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_proj.bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.v_proj.bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.v_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.v_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.57.input_layernorm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.gate.e_score_correction_bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.gate.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.post_attention_layernorm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_norm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_proj.bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.o_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.o_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_norm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_proj.bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.v_proj.bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.v_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.v_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.58.input_layernorm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.gate.e_score_correction_bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.gate.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.post_attention_layernorm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_norm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_proj.bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.o_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.o_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_norm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_proj.bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.v_proj.bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.v_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.v_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.59.input_layernorm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.gate.e_score_correction_bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.gate.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.post_attention_layernorm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_norm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_proj.bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.o_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.o_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_norm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_proj.bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.v_proj.bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.v_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.v_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.60.input_layernorm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.gate.e_score_correction_bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.gate.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.post_attention_layernorm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_norm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_proj.bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.o_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.o_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_norm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_proj.bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.v_proj.bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.v_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.v_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.61.input_layernorm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.gate.e_score_correction_bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.gate.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.post_attention_layernorm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_norm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_proj.bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.o_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.o_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_norm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_proj.bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.v_proj.bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.v_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.v_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.62.input_layernorm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.gate.e_score_correction_bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.gate.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.post_attention_layernorm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_norm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_proj.bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.o_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.o_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_norm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_proj.bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.v_proj.bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.v_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.v_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.63.input_layernorm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.gate.e_score_correction_bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.gate.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.post_attention_layernorm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_norm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_proj.bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.o_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.o_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_norm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_proj.bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.v_proj.bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.v_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.v_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.64.input_layernorm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.gate.e_score_correction_bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.gate.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.post_attention_layernorm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_norm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_proj.bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.o_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.o_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_norm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_proj.bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.v_proj.bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.v_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.v_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.65.input_layernorm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.gate.e_score_correction_bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.gate.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.post_attention_layernorm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_norm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_proj.bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.o_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.o_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_norm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_proj.bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.v_proj.bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.v_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.v_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.66.input_layernorm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.gate.e_score_correction_bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.gate.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.post_attention_layernorm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_norm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_proj.bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.o_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.o_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_norm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_proj.bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.v_proj.bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.v_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.v_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.67.input_layernorm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.gate.e_score_correction_bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.gate.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.post_attention_layernorm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_norm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_proj.bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.o_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.o_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_norm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_proj.bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.v_proj.bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.v_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.v_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.68.input_layernorm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.gate.e_score_correction_bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.gate.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.post_attention_layernorm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_norm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_proj.bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.o_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.o_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_norm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_proj.bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.v_proj.bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.v_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.v_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.69.input_layernorm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.gate.e_score_correction_bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.gate.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.post_attention_layernorm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_norm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_proj.bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.o_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.o_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_norm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_proj.bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.v_proj.bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.v_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.v_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.70.input_layernorm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.gate.e_score_correction_bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.gate.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.post_attention_layernorm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_norm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_proj.bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.o_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.o_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_norm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_proj.bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.v_proj.bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.v_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.v_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.71.input_layernorm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.gate.e_score_correction_bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.gate.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.post_attention_layernorm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_norm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_proj.bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.o_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.o_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_norm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_proj.bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.v_proj.bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.v_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.v_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.72.input_layernorm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.gate.e_score_correction_bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.gate.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.post_attention_layernorm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_norm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_proj.bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.o_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.o_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_norm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_proj.bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.v_proj.bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.v_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.v_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.73.input_layernorm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.gate.e_score_correction_bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.gate.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.post_attention_layernorm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_norm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_proj.bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.o_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.o_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_norm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_proj.bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.v_proj.bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.v_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.v_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.74.input_layernorm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.gate.e_score_correction_bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.gate.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.post_attention_layernorm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_norm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_proj.bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.o_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.o_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_norm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_proj.bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.v_proj.bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.v_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.v_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.75.input_layernorm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.gate.e_score_correction_bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.gate.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.post_attention_layernorm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_norm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_proj.bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.o_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.o_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_norm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_proj.bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.v_proj.bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.v_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.v_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.76.input_layernorm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.gate.e_score_correction_bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.gate.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.post_attention_layernorm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_norm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_proj.bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.o_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.o_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_norm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_proj.bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.v_proj.bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.v_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.v_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.77.input_layernorm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.gate.e_score_correction_bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.gate.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.post_attention_layernorm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_norm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_proj.bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.o_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.o_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_norm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_proj.bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.v_proj.bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.v_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.v_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.78.input_layernorm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.gate.e_score_correction_bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.gate.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.post_attention_layernorm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_norm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_proj.bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.o_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.o_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_norm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_proj.bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.v_proj.bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.v_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.v_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.79.input_layernorm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.gate.e_score_correction_bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.gate.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.post_attention_layernorm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_norm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_proj.bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.o_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.o_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_norm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_proj.bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.v_proj.bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.v_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.v_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.80.input_layernorm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.gate.e_score_correction_bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.gate.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.post_attention_layernorm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_norm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_proj.bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.o_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.o_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_norm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_proj.bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.v_proj.bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.v_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.v_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.81.input_layernorm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.gate.e_score_correction_bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.gate.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.post_attention_layernorm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_norm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_proj.bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.o_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.o_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_norm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_proj.bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.v_proj.bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.v_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.v_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.82.input_layernorm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.gate.e_score_correction_bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.gate.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.post_attention_layernorm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_norm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_proj.bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.o_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.o_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_norm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_proj.bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.v_proj.bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.v_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.v_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.83.input_layernorm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.gate.e_score_correction_bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.gate.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.post_attention_layernorm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_norm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_proj.bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.o_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.o_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_norm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_proj.bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.v_proj.bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.v_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.v_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.84.input_layernorm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.gate.e_score_correction_bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.gate.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.post_attention_layernorm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_norm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_proj.bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.o_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.o_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_norm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_proj.bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.v_proj.bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.v_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.v_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.85.input_layernorm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.gate.e_score_correction_bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.gate.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.post_attention_layernorm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_norm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_proj.bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.o_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.o_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_norm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_proj.bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.v_proj.bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.v_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.v_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.86.input_layernorm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.gate.e_score_correction_bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.gate.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.post_attention_layernorm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_norm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_proj.bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.o_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.o_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_norm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_proj.bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.v_proj.bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.v_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.v_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.87.input_layernorm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.gate.e_score_correction_bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.gate.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.post_attention_layernorm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_norm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_proj.bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.o_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.o_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_norm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_proj.bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.v_proj.bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.v_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.v_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.88.input_layernorm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.gate.e_score_correction_bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.gate.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.post_attention_layernorm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_norm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_proj.bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.o_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.o_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_norm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_proj.bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.v_proj.bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.v_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.v_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.89.input_layernorm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.gate.e_score_correction_bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.gate.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.post_attention_layernorm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_norm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_proj.bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.o_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.o_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_norm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_proj.bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.v_proj.bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.v_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.v_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.90.input_layernorm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.gate.e_score_correction_bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.gate.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.post_attention_layernorm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_norm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_proj.bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.o_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.o_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_norm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_proj.bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.v_proj.bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.v_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.v_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "lm_head.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.input_layernorm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.gate.e_score_correction_bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.gate.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.post_attention_layernorm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_norm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_proj.bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.o_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.o_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_norm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_proj.bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.v_proj.bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.v_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.v_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.norm.weight": "model-00092-of-00092.safetensors"
+ },
+ "metadata": {
+ "total_size": 241145664
+ }
+}
\ No newline at end of file
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..43a71efad1ab3f7e4d66d1e48e7cc44f68f21f3a
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9340665016419c825c4bdabbcc9acc43b7ca2c68ce142724afa829abb1be5efd
+size 19970699
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..053f12c9b03d5acbcc921042ea0c87a6baa5d3f7
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,325 @@
+{
+ "added_tokens_decoder": {
+ "151329": {
+ "content": "<|endoftext|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151330": {
+ "content": "[MASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151331": {
+ "content": "[gMASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151332": {
+ "content": "[sMASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151333": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151334": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151335": {
+ "content": "<|system|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151336": {
+ "content": "<|user|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151337": {
+ "content": "<|assistant|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151338": {
+ "content": "<|observation|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151339": {
+ "content": "<|begin_of_image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151340": {
+ "content": "<|end_of_image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151341": {
+ "content": "<|begin_of_video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151342": {
+ "content": "<|end_of_video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151343": {
+ "content": "<|begin_of_audio|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151344": {
+ "content": "<|end_of_audio|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151345": {
+ "content": "<|begin_of_transcription|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151346": {
+ "content": "<|end_of_transcription|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151347": {
+ "content": "<|code_prefix|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151348": {
+ "content": "<|code_middle|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151349": {
+ "content": "<|code_suffix|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151350": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151351": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151352": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151353": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151354": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151355": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151356": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151357": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151358": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151359": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151360": {
+ "content": "/nothink",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151361": {
+ "content": "<|begin_of_box|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151362": {
+ "content": "<|end_of_box|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151363": {
+ "content": "<|image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151364": {
+ "content": "<|video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ }
+ },
+ "additional_special_tokens": [
+ "<|endoftext|>",
+ "[MASK]",
+ "[gMASK]",
+ "[sMASK]",
+ "",
+ "",
+ "<|system|>",
+ "<|user|>",
+ "<|assistant|>",
+ "<|observation|>",
+ "<|begin_of_image|>",
+ "<|end_of_image|>",
+ "<|begin_of_video|>",
+ "<|end_of_video|>",
+ "<|begin_of_audio|>",
+ "<|end_of_audio|>",
+ "<|begin_of_transcription|>",
+ "<|end_of_transcription|>",
+ "<|code_prefix|>",
+ "<|code_middle|>",
+ "<|code_suffix|>",
+ "/nothink"
+ ],
+ "clean_up_tokenization_spaces": false,
+ "do_lower_case": false,
+ "eos_token": "<|endoftext|>",
+ "extra_special_tokens": {},
+ "model_max_length": 128000,
+ "pad_token": "<|endoftext|>",
+ "padding_side": "left",
+ "remove_space": false,
+ "tokenizer_class": "PreTrainedTokenizer"
+}